Pokémon Type Identifier¶

By Nicholas Levin, Justin Levine, Jarod French, and Anthony Louie

In [7]:
import tensorflow as tf

from tensorflow.keras import datasets, layers, models
import matplotlib.pyplot as plt

from sklearn.model_selection import train_test_split
from sklearn.preprocessing import OneHotEncoder, LabelEncoder
from sklearn.metrics import confusion_matrix

import torch
import torch.nn as nn
from torch.utils.data import DataLoader, ConcatDataset
from torchvision.datasets import ImageFolder
import torchvision.transforms as T

from seaborn import heatmap

import os, random
from PIL import Image
from IPython.display import Image as show_img, display
import PIL
import pandas as pd
import numpy as np
import requests
from bs4 import BeautifulSoup
import csv
import math

Introduction¶

Pokémon is a massive franchise, with over 440 million game copies sold worldwide as of March 2022, in addition to TV shows, trading cards, and other merchandise. Currently, there are a total of 1008 Pokémon across 9 different generations.

Each Pokémon has one or two "types," of which there are 18 in total: Normal, Fire, Water, Grass, Electric, Ice, Fighting, Poison, Ground, Flying, Psychic, Bug, Rock, Ghost, Dark, Dragon, Steel, and Fairy. These types determine the Pokémon's strengths and weaknesses in battle. Additionally, and this is what we explore in this project, these types influence the Pokémon's appearance, and each type usually has some sort of archetype. To demonstrate how type can influence appearance, here are some examples of Fire type Pokémon.

Charmeleon.png

Magmortar.png

Moltres.png

As you can see, Fire-type Pokémon are commonly marked by their warm color palettes, often featuring shades of red, orange, and yellow, as well as flames visible on their bodies. In the same way, the other 17 types each have defining archetypes that set them apart. If you'd like to learn more about Pokémon types, as well as how those types influence each Pokémon, you can read more about them here.

Motivation¶

Although there is a fairly limited number of Pokémon, there is a fairly clear correlation between how a Pokémon looks and its typing. We wanted to test whether we could build a Machine Learning model that would learn these typings and then make accurate predictions on new Pokémon. This has applications in a few areas. Firstly, many Pokémon are leaked before they are officially released, meaning a picture or screenshot is posted on the Internet without any details such as type and name. This model could hopefully assign those images a type, to help us learn more about them.

Additionally, a type-classification model could help for organization purposes. Many Pokémon have associated stuffed animals that are sold in stores, but they don't come with information such as type. This could make it difficult for a store employee or someone who didn't know much of anything about Pokémon to organize the stuffed animals in a meaningful way on store shelves.

Data Collection¶

We collected data using Kaggle, as well as scraping the web. Kaggle is a website with a large number of datasets available to the public that are mostly used for data science and machine learning projects. There are also many Pokémon datasets, but we chose 2 datasets that cover most of the Pokémon that exist. We are using The Complete Pokémon Images Dataset and the Pokémon Gen 1-8 Dataset.

Now, there are 9 generations as mentioned above, and our datasets only cover generations 1-8, since generation 9 has only recently come out. So we had to do a little bit of web scraping. To do this we use the requests, bs4, and csv libraries to gather and format the HTML and extract the new Pokémon's names, types, and images.

In [11]:
url = 'https://pokemondb.net/pokedex/game/scarlet-violet'

# Request the html from the url using the requests library
page = requests.get(url)

# Use Beautiful Soup from bs4 to parse the html and make it more readable 
soup = BeautifulSoup(page.text, 'html.parser')
soup.prettify()

# Usually you might want to stop before this step to look at the html and 
# figure out what data you need from the html; not every website is the same
# Here we need the data in the 'span' sections of the html
soup_imgs = soup.findAll('span')
soup_text = soup.findAll('span')[9::2]

# Get all the text for each Pokémon in a list  
text_list = []

for item in soup_text:
    s = item.text.split(' ')
    text_list.append(s)

# Get only the data we need from each text block 
pokemon = []
for fields in text_list:
    # Here we have some Pokémon whose names have 2 words in them,
    # so we have to adjust our appends accordingly
    if int(fields[0].replace('#','')) < 376:
        if len(fields) > 3:
            pokemon.append(fields[1]+','+fields[2]+','+fields[4])
        else:
            pokemon.append(fields[1]+','+fields[2])
    else:
        if len(fields) > 5:
            pokemon.append(fields[1]+' '+fields[2]+','+fields[3]+','+fields[5])
        elif len(fields) > 4:
            pokemon.append(fields[1]+','+fields[2]+','+fields[4])
        else:
            pokemon.append(fields[1]+','+fields[2])

# Now we have just the Pokémon's name and its type to put in a new list
pokemon_list = []
for entry in pokemon:
    pokemon_list.append(str(entry).split(','))
    
print("This is the first 11 Pokémon in the list:")
print(pokemon_list[:10])
This is the first 11 Pokémon in the list:
[['Sprigatito', 'Grass'], ['Floragato', 'Grass'], ['Meowscarada', 'Grass', 'Dark'], ['Fuecoco', 'Fire'], ['Crocalor', 'Fire'], ['Skeledirge', 'Fire', 'Ghost'], ['Quaxly', 'Water'], ['Quaxwell', 'Water'], ['Quaquaval', 'Water', 'Fighting'], ['Lechonk', 'Normal']]

Now we have each new Pokémon and its type, so we can cross-reference with the CSV we got from Kaggle and add only the new Pokémon, not the Pokémon that are repeated in the new generation.

In [ ]:
# Read the old csv
pm = pd.read_csv('pokemons.csv')

# Drop all columns we will not be using
pm = pm.drop(['NationalNumber','Normal',"Fire","Water","Electric","Grass","Fighting","Poison","Bug","Ice","Ground","Flying","Psychic","Rock","Ghost","Dragon","Dark","Steel","Fairy"],axis=1)

# Make a list of only new Pokémon from our other list
to_add = []
for pokemon in pokemon_list:
    if pokemon[0] not in pm['Pokemon'].values:
        to_add.append(pokemon)

for lst in to_add:
    if len(lst) < 3:
        lst.append('NaN')

# Add each Pokémon to the dataframe
for i in range(0,len(to_add)):
    pm.loc[894+i] = to_add[i]

# Replace any "NaN" strings with actual NaN values
pm = pm.replace("NaN", np.nan)

# Write the dataframe to a new csv
pm.to_csv('./Pokemon_to_gen_9.csv')

Now we have all the Pokémon in our csv so the next step is to get the image urls from the html:

In [ ]:
# Find all images in the html, the first image is the website header in 
# this case so we skip that one
soup_imgs = soup.findAll('img')[1:]

# Get a list of tuples of the html containing the Pokémon names and urls for each Pokémon
images = []
for i in range(0,len(soup_imgs)):
    soup_imgs[i] = str(soup_imgs[i]).split(' ')
    if len(soup_imgs[i]) == 7: # Pokémon has 2 word name
        images.append([soup_imgs[i][1]+" "+soup_imgs[i][2],soup_imgs[i][6]])
    else: # one word name
        images.append([soup_imgs[i][1],soup_imgs[i][5]])

# Break that list into names and urls that correlate by index and get only the names and urls
names = []
urls = []
for i in range(0, len(images)):
    names.append(images[i][0].replace("alt=\"", '').replace("\"", ''))
    urls.append(images[i][1].replace('src=\"', '').replace("\"/>",''))

# Make the list of Pokémon names and images to be added since we already have the 
# Pokémon from previous generations (i.e. take out the repeated Pokémon)
images1 = []
for i in range(0, len(names)): 
    if names[i] not in pm['Pokemon'].values:
        images1.append([names[i], urls[i]])

Now that we have a list of image URLs and names for each Pokémon, we want to save them all to the same folder as the other dataset. This article shows exactly how to save a list of images when you have the url for each, and here is how we did it.

In [ ]:
# List to catch and keep track of any image urls that don't work 
broken_images = []
for img in images1:
    # directory to save images into
    directory = './images1/'
    # if there is a space in the name to be saved
    file_name = img[0].replace(' ','-') + '.png'
    file_path = directory+file_name
    # img[1] is the url of the image
    r = requests.get(img[1], stream=True)
    # status code 200 indicates a successful request
    if r.status_code == 200:
        with open(file_path, 'wb') as f:
            for chunk in r:
                f.write(chunk)
    else:
        broken_images.append(img)

Now we have our csv of all the Pokémon and images for each Pokémon to use as input.

Convolutional Neural Network¶

Since our data is in the form of images, the best way to learn patterns from those images is to use a Convolutional Neural Network (CNN). These Neural Networks work by applying convolutions, or filters that learn from parts of the image, multiple times in order to extract the most important and defining features of that image. These convolutions are followed by pooling layers, which help decrease the size of the convolved features. If you'd like to learn more about the finer details of how CNNs work, this article is a good resource.

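To make the convolution-plus-pooling idea concrete, here is a tiny standalone sketch (not part of our final model) showing how a single Conv2D and MaxPooling2D pair shrinks a 120 x 120 RGB input:

import tensorflow as tf
from tensorflow.keras import layers

# One convolution + pooling step applied to a 120 x 120 RGB image
demo = tf.keras.Sequential([
    layers.Conv2D(8, (3, 3), activation='relu', input_shape=(120, 120, 3)),  # 8 learnable 3x3 filters
    layers.MaxPooling2D((2, 2))                                              # halve the height and width
])
print(demo.output_shape)  # (None, 59, 59, 8): 120 -> 118 after the 3x3 convolution, 59 after pooling
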
Preprocessing the Data¶

With the images from all Pokémon generations 1-9 collected, we first read the Pokémon names and types into a Pandas dataframe sorted by Pokémon name for easy access.

In [7]:
# Load dataframe from csv
df = pd.read_csv("Pokemon_to_gen_9.csv")
df = df.sort_values(by="Pokemon")

Next, we have to build the array of images. Our image array should be of shape (1008, 120, 120, 3): there are 1008 examples, and each image is represented as a 120 x 120 x 3 array, where 120 x 120 is the height and width of the image and 3 is the number of color channels. To do this, we use numpy and the PIL Image module.

In [8]:
# Load images
# TODO: Integrate the gen 8 and 9 dataset
images = np.zeros((df.shape[0], 120, 120, 3), dtype=np.uint8) # keep uint8 so pixel values stay in the 0-255 range
index = 0
for image in os.listdir("data\\images_with_gen_9"):
    img = Image.open("data\\images_with_gen_9\\" + image)
    newimg = Image.new('RGB', img.size, (255, 255, 255))
    newimg.paste(img, None)
    newimg.thumbnail((120, 120))
    data = np.asarray(newimg)
    images[index] = data
    index += 1
c:\Users\justi\AppData\Local\Programs\Python\Python310\lib\site-packages\PIL\Image.py:979: UserWarning: Palette images with Transparency expressed in bytes should be converted to RGBA images
  warnings.warn(

Now that we have our images and types, there are a few more processing steps we must do on the data before we plug it into our model. Firstly, we have to convert our types to their One-Hot Encoded representation. This is a way of turning categorical data (our types, in this case) into an array of binary values that our model can train on more easily. You can read more about why we use One-Hot Encoding here.

In [19]:
labels = df["Type_1"].to_numpy().reshape((-1, 1))

onehot_encoder = OneHotEncoder(sparse=False)
onehot_encoded = onehot_encoder.fit_transform(labels)

Finally, we must split our data into training data and test data. Our training data is what the model trains on, and the test data ensures that the model generalizes well to new examples.

We also divide the pixel values by 255 to normalize our values between 0 and 1.

In [10]:
X_train, X_test, y_train, y_test = train_test_split(images, onehot_encoded, test_size=0.2)
X_train = X_train / 255.0
X_test = X_test / 255.0

Constructing the Model¶

To build the model, we use the Python library tensorflow. The pattern used to build CNNs is Conv2D (convolution) layers followed by MaxPooling2D layers to pool the data. We also use Dropout layers intermittently, which is a good technique to help prevent the model from overfitting to the data.

The activation function we use for our models is ReLU, or the Rectified Linear Unit function. This is a very common activation function for many Neural Networks.

In [11]:
model = models.Sequential()

model.add(layers.Conv2D(128, (6, 6), activation='relu', input_shape=(120, 120, 3)))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Dropout(0.25))
model.add(layers.Conv2D(64, (3, 3), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Dropout(0.25))
model.add(layers.Conv2D(64, (3, 3), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Conv2D(32, (4, 4), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Conv2D(64, (3, 3), activation='relu'))
model.add(layers.MaxPooling2D((2, 2)))
model.add(layers.Dropout(0.4))

Now, we need to get the model to condense the image into 18 outputs, where each of the 18 outputs is the probability that the Pokémon is of the corresponding type. This technique is called a Softmax output, where instead of outputting one prediction on what type the Pokémon is, it outputs confidence values for each type.

To convert the image into those 18 confidence values, we first add a Flatten layer to flatten the image, and then two Dense layers to compact it into 18 outputs.

In [12]:
model.add(layers.Flatten())
model.add(layers.Dense(64, activation='relu'))
model.add(layers.Dense(18, activation='softmax'))

model.summary()
Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
=================================================================
 conv2d (Conv2D)             (None, 115, 115, 128)     13952     
                                                                 
 max_pooling2d (MaxPooling2D  (None, 57, 57, 128)      0         
 )                                                               
                                                                 
 dropout (Dropout)           (None, 57, 57, 128)       0         
                                                                 
 conv2d_1 (Conv2D)           (None, 55, 55, 64)        73792     
                                                                 
 max_pooling2d_1 (MaxPooling  (None, 27, 27, 64)       0         
 2D)                                                             
                                                                 
 dropout_1 (Dropout)         (None, 27, 27, 64)        0         
                                                                 
 conv2d_2 (Conv2D)           (None, 25, 25, 64)        36928     
                                                                 
 max_pooling2d_2 (MaxPooling  (None, 12, 12, 64)       0         
 2D)                                                             
                                                                 
 conv2d_3 (Conv2D)           (None, 9, 9, 32)          32800     
                                                                 
 max_pooling2d_3 (MaxPooling  (None, 4, 4, 32)         0         
 2D)                                                             
                                                                 
 conv2d_4 (Conv2D)           (None, 2, 2, 64)          18496     
                                                                 
 max_pooling2d_4 (MaxPooling  (None, 1, 1, 64)         0         
 2D)                                                             
                                                                 
 dropout_2 (Dropout)         (None, 1, 1, 64)          0         
                                                                 
 flatten (Flatten)           (None, 64)                0         
                                                                 
 dense (Dense)               (None, 64)                4160      
                                                                 
 dense_1 (Dense)             (None, 18)                1170      
                                                                 
=================================================================
Total params: 181,298
Trainable params: 181,298
Non-trainable params: 0
_________________________________________________________________

Training the Model¶

With our model built, we must now compile the model and get it ready for training. For our optimizer, we used the Adam optimizer, which has been shown to be effective for many Neural Networks. For our loss function, we used CategoricalCrossentropy loss, which makes sense given the categorical nature of our data.

In [13]:
model.compile(optimizer='adam',
              loss=tf.keras.losses.CategoricalCrossentropy(from_logits=False),
              metrics=['accuracy'])

All that is left to do now is fit the model to the data. We used 30 epochs, since we didn't want the model to overfit on the data.

In [14]:
history = model.fit(X_train, y_train, epochs=30, 
                    validation_data=(X_test, y_test))
Epoch 1/30
25/25 [==============================] - 29s 1s/step - loss: 2.8333 - accuracy: 0.0892 - val_loss: 2.8160 - val_accuracy: 0.1250
Epoch 2/30
25/25 [==============================] - 28s 1s/step - loss: 2.7799 - accuracy: 0.0992 - val_loss: 2.7763 - val_accuracy: 0.1250
Epoch 3/30
25/25 [==============================] - 27s 1s/step - loss: 2.7650 - accuracy: 0.1269 - val_loss: 2.7812 - val_accuracy: 0.1100
Epoch 4/30
25/25 [==============================] - 28s 1s/step - loss: 2.7288 - accuracy: 0.1168 - val_loss: 2.7432 - val_accuracy: 0.1150
Epoch 5/30
25/25 [==============================] - 28s 1s/step - loss: 2.7544 - accuracy: 0.1382 - val_loss: 2.7653 - val_accuracy: 0.1250
Epoch 6/30
25/25 [==============================] - 27s 1s/step - loss: 2.7453 - accuracy: 0.1206 - val_loss: 2.7435 - val_accuracy: 0.1400
Epoch 7/30
25/25 [==============================] - 28s 1s/step - loss: 2.6958 - accuracy: 0.1570 - val_loss: 2.7081 - val_accuracy: 0.1650
Epoch 8/30
25/25 [==============================] - 31s 1s/step - loss: 2.6709 - accuracy: 0.1734 - val_loss: 2.7511 - val_accuracy: 0.0950
Epoch 9/30
25/25 [==============================] - 27s 1s/step - loss: 2.6429 - accuracy: 0.1822 - val_loss: 2.6886 - val_accuracy: 0.1450
Epoch 10/30
25/25 [==============================] - 29s 1s/step - loss: 2.5927 - accuracy: 0.1985 - val_loss: 2.6755 - val_accuracy: 0.1450
Epoch 11/30
25/25 [==============================] - 28s 1s/step - loss: 2.5748 - accuracy: 0.1960 - val_loss: 2.6530 - val_accuracy: 0.1500
Epoch 12/30
25/25 [==============================] - 29s 1s/step - loss: 2.5622 - accuracy: 0.2048 - val_loss: 2.7139 - val_accuracy: 0.1500
Epoch 13/30
25/25 [==============================] - 28s 1s/step - loss: 2.5594 - accuracy: 0.2111 - val_loss: 2.6558 - val_accuracy: 0.1650
Epoch 14/30
25/25 [==============================] - 28s 1s/step - loss: 2.5178 - accuracy: 0.2085 - val_loss: 2.6565 - val_accuracy: 0.1600
Epoch 15/30
25/25 [==============================] - 28s 1s/step - loss: 2.4908 - accuracy: 0.2173 - val_loss: 2.6749 - val_accuracy: 0.1850
Epoch 16/30
25/25 [==============================] - 3497s 146s/step - loss: 2.4696 - accuracy: 0.2425 - val_loss: 2.7792 - val_accuracy: 0.1950
Epoch 17/30
25/25 [==============================] - 36s 1s/step - loss: 2.4364 - accuracy: 0.2286 - val_loss: 2.7056 - val_accuracy: 0.2000
Epoch 18/30
25/25 [==============================] - 36s 1s/step - loss: 2.4474 - accuracy: 0.2312 - val_loss: 2.6667 - val_accuracy: 0.2050
Epoch 19/30
25/25 [==============================] - 33s 1s/step - loss: 2.3808 - accuracy: 0.2462 - val_loss: 2.6910 - val_accuracy: 0.1600
Epoch 20/30
25/25 [==============================] - 32s 1s/step - loss: 2.3190 - accuracy: 0.2626 - val_loss: 2.6669 - val_accuracy: 0.1900
Epoch 21/30
25/25 [==============================] - 30s 1s/step - loss: 2.2413 - accuracy: 0.2802 - val_loss: 2.8163 - val_accuracy: 0.1800
Epoch 22/30
25/25 [==============================] - 28s 1s/step - loss: 2.1701 - accuracy: 0.2864 - val_loss: 2.8253 - val_accuracy: 0.1400
Epoch 23/30
25/25 [==============================] - 28s 1s/step - loss: 2.1007 - accuracy: 0.3304 - val_loss: 2.8053 - val_accuracy: 0.1750
Epoch 24/30
25/25 [==============================] - 33s 1s/step - loss: 2.0370 - accuracy: 0.3417 - val_loss: 2.9711 - val_accuracy: 0.1600
Epoch 25/30
25/25 [==============================] - 31s 1s/step - loss: 1.9295 - accuracy: 0.3794 - val_loss: 2.9420 - val_accuracy: 0.1900
Epoch 26/30
25/25 [==============================] - 30s 1s/step - loss: 1.8247 - accuracy: 0.4183 - val_loss: 3.1224 - val_accuracy: 0.1350
Epoch 27/30
25/25 [==============================] - 30s 1s/step - loss: 1.7995 - accuracy: 0.4070 - val_loss: 3.2105 - val_accuracy: 0.1450
Epoch 28/30
25/25 [==============================] - 29s 1s/step - loss: 1.7326 - accuracy: 0.4410 - val_loss: 2.9188 - val_accuracy: 0.1650
Epoch 29/30
25/25 [==============================] - 29s 1s/step - loss: 1.6075 - accuracy: 0.4824 - val_loss: 3.2015 - val_accuracy: 0.1550
Epoch 30/30
25/25 [==============================] - 29s 1s/step - loss: 1.4827 - accuracy: 0.5415 - val_loss: 3.4270 - val_accuracy: 0.1450
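
The log above shows the training accuracy climbing while the validation loss bottoms out around epoch 11 and then climbs, a sign of overfitting. One way to cap training automatically (just a sketch; we did not use it in this run) is Keras's EarlyStopping callback:

from tensorflow.keras.callbacks import EarlyStopping

# Stop once val_loss has not improved for 5 consecutive epochs, keeping the best weights seen
early_stop = EarlyStopping(monitor='val_loss', patience=5, restore_best_weights=True)
# history = model.fit(X_train, y_train, epochs=30,
#                     validation_data=(X_test, y_test), callbacks=[early_stop])
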
In [15]:
y_predict = model.predict(X_test)
7/7 [==============================] - 2s 161ms/step

Viewing Results¶

We can now use a confusion matrix to see how accurately the CNN classified the test data set. First, we can generate one large confusion matrix, displaying the amount of predicted examples for each type against the amount of true examples for each type.

In [41]:
confusion = confusion_matrix(np.argmax(y_test, axis=1), np.argmax(y_predict, axis=1))
heatmap(confusion, annot=True, xticklabels=list(onehot_encoder.categories_[0]), yticklabels=list(onehot_encoder.categories_[0]), fmt="g")
plt.xlabel("Predicted type")
plt.ylabel("True type")
plt.show()

The confusion matrix shows that types like Water, Fire, and Normal have the most correct positive predictions. However, with this large matrix, it is not immediately visible which types are most accurately predicted overall.

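One quick way to make that visible is to rank the types by recall, i.e. the fraction of each type's test examples whose top prediction was correct. This is just a small sketch reusing the objects defined above:

type_names = list(onehot_encoder.categories_[0])
# Recompute the matrix with explicit labels so every type gets a row,
# even if it happens to be missing from this particular test split
cm = confusion_matrix(np.argmax(y_test, axis=1), np.argmax(y_predict, axis=1),
                      labels=list(range(len(type_names))))
# Per-type recall: correct predictions on the diagonal divided by true examples per row
recall_per_type = np.diag(cm) / np.maximum(cm.sum(axis=1), 1)
for name, recall in sorted(zip(type_names, recall_per_type), key=lambda pair: -pair[1]):
    print(f"{name}: {recall:.2f}")
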
To check how accurately each type is classified, we can also generate a separate binary confusion matrix for each individual type. In this case, we count the 3 most likely predictions as positive labels. In other words, for a given type, a true positive outcome is if a Pokemon has that type and the CNN's top 3 predictions for the Pokemon include that type. Similarly, a true negative is if a Pokemon does not have that type and none of the CNN's top 3 predictions for the Pokemon are that type.

In [42]:
for i in range(len(onehot_encoder.categories_[0])):
    binary_y_test = [True if np.argmax(y) == i else False for y in y_test]
    binary_y_predict = [True if i in np.argsort(y)[-3:] else False for y in y_predict]
    confusion = confusion_matrix(y_true=binary_y_test, y_pred=binary_y_predict, labels=[True, False])
    heatmap(confusion, annot=True, xticklabels=[True, False], yticklabels=[True, False], fmt="g")
    plt.title(onehot_encoder.categories_[0][i])
    plt.xlabel("Top 3 predicted types")
    plt.ylabel("True type")
    plt.show()

Now we can see that types like Rock, Electric, and especially Fire are types that often have a high probability of prediction, even if many of the Pokemon in the test set do not actually have those types.

Building a Generative Adversarial Network (GAN)¶

Motivation for the GAN¶

Every new generation of Pokémon games comes with a totally new cast of Pokémon. As more games come out and more Pokémon are added, designs for new Pokémon may become harder to come up with over time. One way to help with inspiration is to get input from outside sources. Sometimes artists go to art galleries when they are stumped for their next piece, or writers hit writer's block and need a new perspective. The resulting generator can serve as this new perspective.

What are GANs?¶

GANs are composed of two models: a discriminator and a generator. The generator is what actually makes the new Pokémon. In order to train the generator, we use a discriminator, whose purpose is to decide whether or not an input is real, i.e. an example taken from the data's distribution. The inputs to the discriminator are real examples and the outputs of the generator, and its predictions are what are used to train the GAN. If you are interested in reading more, check out this blog post.

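To make the interplay concrete, below is a minimal, self-contained sketch of one adversarial training step using tiny stand-in models (the actual convolutional discriminator and generator are built in the following sections). Note that this sketch uses the textbook labelling of real = 1 and fake = 0; our training functions later in the notebook flip those labels and add a little smoothing noise.

import torch
import torch.nn as nn
import torch.nn.functional as F

# Tiny stand-ins working on 3 x 8 x 8 "images"; the real models use conv layers
toy_disc = nn.Sequential(nn.Flatten(), nn.Linear(3 * 8 * 8, 1), nn.Sigmoid())
toy_gen = nn.Sequential(nn.Linear(16, 3 * 8 * 8), nn.Tanh(), nn.Unflatten(1, (3, 8, 8)))
d_opt = torch.optim.Adam(toy_disc.parameters(), lr=1e-3)
g_opt = torch.optim.Adam(toy_gen.parameters(), lr=1e-3)

real_batch = torch.rand(4, 3, 8, 8)  # stand-in for a batch of real images

# Discriminator step: push outputs toward 1 on real images, 0 on generated ones
d_opt.zero_grad()
fake_batch = toy_gen(torch.randn(4, 16)).detach()
d_loss = (F.binary_cross_entropy(toy_disc(real_batch), torch.ones(4, 1))
          + F.binary_cross_entropy(toy_disc(fake_batch), torch.zeros(4, 1)))
d_loss.backward()
d_opt.step()

# Generator step: push the discriminator's output on fresh fakes toward "real"
g_opt.zero_grad()
g_loss = F.binary_cross_entropy(toy_disc(toy_gen(torch.randn(4, 16))), torch.ones(4, 1))
g_loss.backward()
g_opt.step()
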
In [8]:
IMAGE_DIR = 'data/'
image_size = 64
batch_size = 4
normalization_stats = (0.5, 0.5, 0.5), (0.5, 0.5, 0.5) # Convert channels from [0, 1] to [-1, 1]

One way to address the limited-data issue is to transform the data we do have, for example by mirroring images across an axis; shifting the image is another option. Here we do a horizontal flip, which mirrors the image left to right.

We specifically avoid a vertical flip because we don't want to train on images where, for example, a Pokémon's feet end up above its head.

Another way to increase the amount of data would be to use different images of the same Pokémon in different art styles. There are many different ways Pokémon are drawn, both in official games and by fans. Even within the games, there can be multiple versions of the image, like the Pokédex entry image, the in-battle image, etc. This would mean collecting more data, though.

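For illustration only, a shift-based augmentation could be written with torchvision's RandomAffine transform; this sketch is not part of our actual pipeline, which uses just the horizontal flip shown in the next cell.

# Hypothetical extra augmentation: randomly shift the image by up to 10%
# of its width and height (not used in our training below)
shift_dataset = ImageFolder(IMAGE_DIR, transform=T.Compose([
    T.Resize(image_size),
    T.CenterCrop(image_size),
    T.RandomAffine(degrees=0, translate=(0.1, 0.1)),
    T.ToTensor(),
    T.Normalize(*normalization_stats)]))
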
In [9]:
normal_dataset = ImageFolder(IMAGE_DIR, transform=T.Compose([
    T.Resize(image_size),
    T.CenterCrop(image_size),
    T.ToTensor(),
    T.Normalize(*normalization_stats)]))

# Augment the dataset with mirrored images
mirror_dataset = ImageFolder(IMAGE_DIR, transform=T.Compose([
    T.Resize(image_size),
    T.CenterCrop(image_size),
    T.RandomHorizontalFlip(p=1.0),
    T.ToTensor(),
    T.Normalize(*normalization_stats)]))

# Combine the datasets
dataset_list = [normal_dataset, mirror_dataset]
dataset = ConcatDataset(dataset_list)

dataloader = DataLoader(dataset, batch_size, shuffle=True, num_workers=4, pin_memory=False)

Designing the Discriminator¶

One of the two main models within the GAN, the discriminator takes inputs, in this case images of Pokémon, and predicts whether they are real or fake. The structure of the model (which layers to use, how many, and their hyperparameters) can be almost anything, as long as each layer's output matches the next layer's input. The only layer that is really fixed is the last one, the output layer. Because the output is binary, real or fake, we use a sigmoid activation, though other activation functions could also work.

In [10]:
dis = nn.Sequential(
  # Input is 3 x 64 x 64
  nn.Conv2d(3, 64, kernel_size=4, stride=2, padding=1, bias=False),
  nn.BatchNorm2d(64),
  nn.LeakyReLU(0.2, inplace=True),
  # Layer Output: 64 x 32 x 32
  
  nn.Conv2d(64, 128, kernel_size=4, stride=2, padding=1, bias=False),
  nn.BatchNorm2d(128),
  nn.LeakyReLU(0.2, inplace=True),
  # Layer Output: 128 x 16 x 16
  
  nn.Conv2d(128, 128, kernel_size=4, stride=2, padding=1, bias=False),
  nn.BatchNorm2d(128),
  nn.LeakyReLU(0.2, inplace=True),
  # Layer Output: 128 x 8 x 8
  
  nn.Conv2d(128, 128, kernel_size=4, stride=2, padding=1, bias=False),
  nn.BatchNorm2d(128),
  nn.LeakyReLU(0.2, inplace=True),
  # Layer Output: 128 x 4 x 4
  
  # With a 4x4, we can condense the channels into a 1 x 1 x 1 to produce output
  nn.Conv2d(128, 1, kernel_size=4, stride=1, padding=0, bias=False),
  nn.Flatten(),
  nn.Sigmoid()
)

Designing the Generator¶

The Generator is the other main model within the GAN and is the part we are actually interested in. It takes in random noise and outputs images that should ideally represent some new Pokémon; these outputs should trick the discriminator. Again, the structure of the model can be anything as long as consecutive layers match up. This is slightly more complicated because the output layer should produce a shape that resembles an image. Because we use 64 x 64 x 3 images for actual Pokémon, we do the same for these fake Pokémon.

In [11]:
seed_size = 16

gen = nn.Sequential(
  # Input seed_size x 1 x 1
  nn.ConvTranspose2d(seed_size, 128, kernel_size=4, padding=0, stride=1, bias=False),
  nn.BatchNorm2d(128),
  nn.ReLU(True),
  # Layer output: 128 x 4 x 4
  
  nn.ConvTranspose2d(128, 128, kernel_size=4, padding=1, stride=2, bias=False),
  nn.BatchNorm2d(128),
  nn.ReLU(True),
  # Layer output: 128 x 8 x 8
  
  nn.ConvTranspose2d(128, 128, kernel_size=4, padding=1, stride=2, bias=False),
  nn.BatchNorm2d(128),
  nn.ReLU(True),
  # Layer output: 128 x 16 x 16
  
  nn.ConvTranspose2d(128, 64, kernel_size=4, padding=1, stride=2, bias=False),
  nn.BatchNorm2d(64),
  nn.ReLU(True),
  # Layer output: 64 x 32 x 32
  
  nn.ConvTranspose2d(64, 3, kernel_size=4, padding=1, stride=2, bias=False),
  nn.Tanh()
  # Output: 3 x 64 x 64
)

GPU Setup¶

Set up the GPU so we can take advantage of its parallel computing power; training on the CPU would take significantly more time.

In [12]:
def get_training_device():
    # Use the GPU if possible
    if torch.cuda.is_available():
        return torch.device('cuda')
    # Otherwise use the CPU :-(
    return torch.device('cpu')

def to_device(data, device):
    # This moves the tensors to the device (GPU, CPU)
    if isinstance(data, (list,tuple)):
        return [to_device(x, device) for x in data]
    return data.to(device, non_blocking=True)

class DeviceDataLoader():
    """Wrap a dataloader to move data to a device"""
    def __init__(self, dataloader, device):
        self.dataloader = dataloader
        self.device = device
        
    def __iter__(self):
        """Yield a batch of data after moving it to device"""
        for b in self.dataloader: 
            yield to_device(b, self.device)

    def __len__(self):
        """Number of batches"""
        return len(self.dataloader)

Ensure the GPU is active. The device below should be of type 'cuda', meaning the CUDA cores on the GPU will be used. If the type is 'cpu', then training will run on the CPU.

In [13]:
device = get_training_device()
device
Out[13]:
device(type='cuda')

Now, we use the device dataloader class to send data to our chosen device which should be the GPU:

In [14]:
dev_dataloader = DeviceDataLoader(dataloader, device)

Training Functions¶

Training is taken in turns because we have to use the output from the models to train the other model. This article is helpful in seeing how the two models interact.

Discriminator¶

The discriminator takes real Pokémon and learns from them, then takes the fake Pokémon from the generator and learns from those as well. The combined loss is then backpropagated to update the weights of each layer.

In [15]:
def train_discriminator(real_pokemon, disc_optimizer):
    # Reset the gradients for the optimizer
    disc_optimizer.zero_grad()
    
    # Train on the real images. Note the label convention used here: real
    # images get targets near 0 and generated images get targets near 1,
    # with a little random noise acting as label smoothing.
    real_predictions = discriminator(real_pokemon)
    real_targets = torch.rand(real_pokemon.size(0), 1, device=device) * (0.1 - 0) + 0
    real_loss = F.binary_cross_entropy(real_predictions, real_targets)
    real_score = torch.mean(real_predictions).item()
    
    # Make some latent tensors to seed the generator
    latent_batch = torch.randn(batch_size, seed_size, 1, 1, device=device)
    
    # Get some fake pokemon
    fake_pokemon = generator(latent_batch)
    
    # Train on the generator's current efforts to trick the discriminator
    gen_predictions = discriminator(fake_pokemon)
    gen_targets = torch.rand(fake_pokemon.size(0), 1, device=device) * (1 - 0.9) + 0.9
    gen_loss = F.binary_cross_entropy(gen_predictions, gen_targets)
    gen_score = torch.mean(gen_predictions).item()
    
    # Update the discriminator weights using backpropagation
    total_loss = real_loss + gen_loss
    total_loss.backward()
    disc_optimizer.step()

    # Return discriminator loss and scores from the real data and generator data
    return total_loss.item(), real_score, gen_score

Generator¶

The generator trains by generating fake Pokémon, running them through the current discriminator, and using the discriminator's predictions to update its own weights. This is why we need to set up training to alternate between the two models.

In [16]:
def train_generator(gen_optimizer):
    # Clear the generator gradients
    gen_optimizer.zero_grad()
    
    # Generate some fake pokemon
    latent_batch = torch.randn(batch_size, seed_size, 1, 1, device=device)
    fake_pokemon = generator(latent_batch)
    
    # Test against the discriminator
    disc_predictions = discriminator(fake_pokemon)
    targets = torch.zeros(fake_pokemon.size(0), 1, device=device)
    loss = F.binary_cross_entropy(disc_predictions, targets)
    
    # Update the generator based on how well it did against the discriminator using backpropgation
    loss.backward()
    gen_optimizer.step()
    
    # Return generator loss
    return loss.item()

Deciding how much to train one model before swapping to the other and back is another problem. It could be the case that one model converges faster than the other, so finding the optimal amount requires some empirical analysis of the models, the data itself, and other factors.

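As a sketch of what such a schedule could look like, the hypothetical helper below takes several discriminator steps for every generator step; the ratio is a made-up knob, not something we tuned, and the function reuses the same globals as the train() function defined later.

# Hypothetical alternating schedule: k discriminator updates per generator update
def train_alternating(epochs, learning_rate, disc_steps_per_gen_step=2):
    disc_optimizer = torch.optim.Adam(discriminator.parameters(), lr=learning_rate, betas=(0.5, 0.9))
    gen_optimizer = torch.optim.Adam(generator.parameters(), lr=learning_rate, betas=(0.5, 0.9))
    for epoch in range(epochs):
        for real_img, _ in dev_dataloader:
            # Give the discriminator a few extra updates on this batch...
            for _ in range(disc_steps_per_gen_step):
                train_discriminator(real_img, disc_optimizer)
            # ...before the generator takes its turn
            train_generator(gen_optimizer)
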
Results¶

So that we can see the results as we generate Pokémon, we will save the outputs from each epoch to a folder called Results.

In [17]:
import os
from torchvision.utils import save_image

RESULTS_DIR = 'Results/'
os.makedirs(RESULTS_DIR, exist_ok=True)
In [18]:
import torch
from torchvision.utils import make_grid
import matplotlib.pyplot as plt
%matplotlib inline
In [19]:
# Reverse the normalization of the images so we can view them properly
def denorm(image):
    return image * normalization_stats[1][0] + normalization_stats[0][0]
def show_images(images, nmax=64):
    fig, ax = plt.subplots(figsize=(8, 8))
    ax.set_xticks([]); ax.set_yticks([])
    ax.imshow(make_grid(denorm(images.detach()[:nmax]), nrow=8).permute(1, 2, 0))
def show_batch(dataloader, nmax=64):
    for images, _ in dataloader:
        show_images(images, nmax)
        break
In [20]:
def save_results(index, latent_batch, show=True):
    # Generate fake pokemon
    fake_pokemon = generator(latent_batch)
    
    # Make the filename for the output
    fake_file = "result_image_for_epoch-{0:0=4d}.png".format(index)
    
    # Save the image
    save_image(denorm(fake_pokemon), os.path.join(RESULTS_DIR, fake_file), nrow=8)
    print("Result Saved!")
    
    if show:
        fig, ax = plt.subplots(figsize=(10, 10))
        ax.set_xticks([]); ax.set_yticks([])
        ax.imshow(make_grid(fake_pokemon.cpu().detach(), nrow=8).permute(1, 2, 0))

Run Training¶

This sets up the framework for training and uses all of the methods defined above.

In [21]:
import torch.nn.functional as F

# Static generation seed batch
fixed_latent_batch = torch.randn(64, seed_size, 1, 1, device=device)

def train(epochs, learning_rate, start_idx=1):
    # Empty the GPU cache to save some memory
    torch.cuda.empty_cache()
    
    # Track losses and scores
    disc_losses = []
    disc_scores = []
    gen_losses = []
    gen_scores = []
    
    # Create the optimizers
    disc_optimizer = torch.optim.Adam(discriminator.parameters(), lr=learning_rate, betas=(0.5, 0.9))
    gen_optimizer = torch.optim.Adam(generator.parameters(), lr=learning_rate, betas=(0.5, 0.9))
    
    # Run the loop
    for epoch in range(epochs):
        # Go through each image
        for real_img, _ in dev_dataloader:
            # Train the discriminator
            disc_loss, real_score, gen_score = train_discriminator(real_img, disc_optimizer)

            # Train the generator
            gen_loss = train_generator(gen_optimizer)
        
        # Collect results
        disc_losses.append(disc_loss)
        disc_scores.append(real_score)
        gen_losses.append(gen_loss)
        gen_scores.append(gen_score)
        
        # Print the losses and scores
        print("Epoch [{}/{}], gen_loss: {:.4f}, disc_loss: {:.4f}, real_score: {:.4f}, gen_score: {:.4f}".format(
            epoch+start_idx, epochs, gen_loss, disc_loss, real_score, gen_score))
        
        # Save the images and show the progress
        save_results(epoch + start_idx, fixed_latent_batch, show=False)
    
    # Return stats
    return disc_losses, disc_scores, gen_losses, gen_scores

Selecting Models¶

Here, we select the models we want to send to the GPU.

In [22]:
# Set the discriminator to device
discriminator = to_device(dis, device)

# Set the generator to device
generator = to_device(gen, device)

Training Time¶

Set the hyperparameters for training the GAN. The cell below then loads previously saved model weights from the gan-checkpoints folder.

In [23]:
# initial hyperparameters: lr = 0.002, epochs = 50
learning_rate = 0.002
epochs = 50
In [25]:
discriminator.load_state_dict(torch.load("gan-checkpoints\\discriminator-model.pth"))
generator.load_state_dict(torch.load("gan-checkpoints\\generator-model.pth"))
Out[25]:
<All keys matched successfully>

Results¶

Here, we will view some of the results from the Pokémon GAN using IPython's Image class.

This is the result after the first epoch.

In [26]:
show_img('Results/result_image_for_epoch-0001.png')
Out[26]:

At 25 epochs, more distinct features start appearing, like tails and legs.

In [27]:
show_img('Results/result_image_for_epoch-0025.png')
Out[27]:

At 50 epochs, this is the final result.

In [28]:
show_img('Results/result_image_for_epoch-0050.png')
Out[28]:

Performance Analysis¶

Here are some plots to help tune the generator/discriminator. This shows losses and scores over time.

In [ ]:
# Extract metrics (history here is the tuple returned by train())
disc_losses, disc_scores, gen_losses, gen_scores = history
In [ ]:
# Plot generator and discriminator losses
plt.plot(disc_losses, '-')
plt.plot(gen_losses, '-')
plt.xlabel('Epoch')
plt.ylabel('Loss')
plt.legend(['Discriminator', 'Generator'])
plt.title('Losses')

[Plot: discriminator and generator loss per epoch from a previous training run]

The graph above is from a previous run of our GAN with the same data set. It shows that the discriminator had lower loss throughout training, with a general downward trend as the epochs passed, while the generator had a much higher loss that never really tapered off. This could signal that the generated data isn't very good, which makes sense if you look at the image results: they don't really resemble Pokémon. The only resemblance is the overall shape; you can see some key features in some outputs, like legs and tails, which are found in Pokémon, but the finer details such as eyes, mouths, and fingers are missing. The key characteristic that is missing is distinct coloring. Pokémon typically have solid colors with clear separation between them, but the outputs are more of a gradient of colors, with no solid regions next to each other.

Saving Model Weights¶

Checkpoint the weights so the models can be further trained and examined later.

In [ ]:
# Save generator and discriminator weights
torch.save(discriminator.state_dict(), 'discriminator-model.pth')
torch.save(generator.state_dict(), 'generator-model.pth')

Conclusions¶

Overall, we learned that our models still have a decent way to go before they are capable of reliably classifying our examples. We learned that there is a lot of context behind classifying Pokémon that makes it difficult for a Machine Learning algorithm to learn. For example, we know that Grass-type Pokémon look plant-like, and we have examples of plants in our heads that we can compare the Pokémon to, while the model does not.

As for our GAN, it was able to learn the general shape of a Pokémon, but the colors were more abstract and it didn't output the solid colors usually found in Pokémon. Both of our models suffered from a severe lack of data, something that is incredibly important when training image recognition models like these. Being limited to only 1008 Pokémon, our models were unable to fully learn the patterns, but we could definitely see the beginnings of patterns being learned. It would be interesting going forward to experiment with using the GAN output as an input to our CNN, and to see what would happen if more data were added to the mix.
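
As a rough sketch of that first follow-up idea (assuming the generator, denorm, and the Keras model from the cells above are still in memory), a generated image could be fed through the type classifier like this:

# Generate one fake Pokémon, resize it to the CNN's 120 x 120 input size, and classify it
latent = torch.randn(1, seed_size, 1, 1, device=device)
fake = denorm(generator(latent)).cpu().detach()             # 1 x 3 x 64 x 64, values in [0, 1]
fake_img = T.ToPILImage()(fake.squeeze(0)).resize((120, 120))
fake_arr = np.asarray(fake_img)[np.newaxis, ...] / 255.0    # shape (1, 120, 120, 3)
predicted_type = onehot_encoder.categories_[0][np.argmax(model.predict(fake_arr))]
print(predicted_type)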