Create script for t-SNE visualization of samples

ThanosM97 · Jul 17, 2022 · ce105fe · ce105fe
1 parent e5e216d
commit ce105fe
Showing 1 changed file with 227 additions and 0 deletions.
diff --git a/tsne.py b/tsne.py
@@ -0,0 +1,227 @@
+"""
+This module creates a t-SNE visualization of generated images 
+to qualitatively examine the generator's distribution and evaluate the 
+diversity in terms of the generated samples. In particular, it uses the
+pre-trained VGG-19 model to extract features (4096d) of from the generated 
+images, which are then compressed to 300d using the PCA algorithm.
+Subsequently, the t-SNE algorithm is used to map those pca features to two
+dimensions, which are then ploted in an image grid, with images placed in 
+neighboring tiles based on their similarity distance.
+"""
+import argparse
+
+import matplotlib.pyplot as plt
+import numpy as np
+import rasterfairy
+import torch
+from matplotlib.patches import Patch
+from matplotlib.pyplot import imshow
+from PIL import Image, ImageOps
+from seaborn import color_palette
+from sklearn.decomposition import PCA
+from sklearn.manifold import TSNE
+from torch.utils.data import DataLoader
+from torchvision import transforms
+from torchvision.datasets import ImageFolder
+from torchvision.models import vgg19
+from torchvision.models.feature_extraction import create_feature_extractor
+from tqdm import tqdm
+
+
+def factors(num: int) -> "tuple[int,int]":
+    """Return `num`'s two closer factors to its square root."""
+    ny = int(np.ceil(np.sqrt(num)))
+    nx = int(num/ny)
+    while nx * ny != num:
+        ny -= 1
+        nx = int(num/ny)
+    return nx, ny
+
+
+def get_colors(nclasses: int) -> "tuple[color_palette, list]":
+    """Return an sns color_palette and the corresponding RGB colors in [0,255].
+
+    Args:
+        - nclasses (int) : number of classes in the samples
+    """
+    palette = color_palette(n_colors=nclasses)
+    colors = []
+    for color in palette:
+        rgb_color = [int(val*255) for val in color]
+        colors.append(tuple(rgb_color))
+
+    return palette, colors
+
+
+def get_loader(path: str, batch_size: int) -> "tuple[DataLoader, int]":
+    """Return a dataloader and the corresponding number of classes found.
+
+    This function uses PyTorch's ImageFolder to create a dataset. It returns
+    the dataloader and the number of classes found in `path`.
+
+    Args:
+        - path (str) : path to generated samples 
+                       (format: dir/{class-0, class-1, ...}/image_X.png)
+        - batch_size (int) : number of samples per batch
+    """
+    data = ImageFolder(path, transforms.ToTensor())
+    nclasses = len(data.classes)
+    dataloader = DataLoader(
+        data,
+        batch_size=batch_size,
+        shuffle=True,
+        drop_last=False
+    )
+    return dataloader, nclasses
+
+
+def pca(features: torch.Tensor, components: int = 300) -> np.array:
+    """Calculate and return PCA features for `components` dimensions.
+
+    Args:
+        - features (Tensor) : extracted features from VGG-19
+        - components (int, optional) : number of components to use in PCA
+                                       (Default: 300)
+    """
+    features = np.array(features)
+    pca_model = PCA(n_components=components)
+    pca_model.fit(features)
+    pca_features = pca_model.transform(features)
+
+    return np.array(pca_features)
+
+
+def visualize(args: argparse.Namespace):
+    """Create t-SNE visualization of the dataset in `path` directory.
+
+    This function creates a t-SNE visualization of the dataset in `path`
+    directory and saves it as `filename`.png .
+
+    Args:
+        - args.path (str) : path to the directory of the generated images. 
+                            The directory should have the following format:
+                                dir/{class-0, class-1, ...}/image_X.png)
+        - args.filename (str) : filename for the .png file
+        - args.nsamples (int) : number of samples to use from each class
+        - args.title (str, optional) : title for the image 
+                                       (Default: t-SNE visualization)
+        - args.batch_size (int, optional) : number of samples per batch
+                                            (Default: 32)
+    """
+    # Load pretrained vgg19 model
+    model = vgg19(weights="VGG19_Weights.DEFAULT").eval()
+
+    # Define feature extractor
+    feature_extractor = create_feature_extractor(
+        model, return_nodes=['classifier.3'])
+
+    # Get dataloader
+    dataloader, nclasses = get_loader(args.path, args.batch_size)
+
+    total_samples = nclasses * args.nsamples
+
+    if total_samples > len(dataloader.dataset):
+        print((f"[ERROR] Not enough samples generated. (total_samples_found" +
+               f"={len(dataloader.dataset)})"))
+        exit(1)
+
+    # Extract features using VGG19
+    images = torch.Tensor()
+    features = torch.Tensor()
+    labels = torch.Tensor()
+
+    batches = total_samples//args.batch_size
+    with tqdm(total=batches, desc="Extracting features") as pbar:
+        for i, (img, label) in enumerate(dataloader):
+            with torch.no_grad():
+                features = torch.cat(
+                    [features, feature_extractor(img)['classifier.3']],
+                    dim=0)
+                images = torch.cat(
+                    [images, img],
+                    dim=0)
+                labels = torch.cat(
+                    [labels, label],
+                    dim=0)
+
+            if (i+1)*args.batch_size > total_samples:
+                features = features[:total_samples]
+                images = images[:total_samples]
+                labels = labels[:total_samples]
+                break
+
+            pbar.update(1)
+
+    # Get PCA features
+    pca_features = pca(features)
+
+    # TSNE transformation
+    tsne = TSNE(n_components=2, learning_rate=150, perplexity=30, angle=0.2,
+                init="random", verbose=1).fit_transform(pca_features)
+
+    # Image configurations
+    palette, colors = get_colors(nclasses)
+    nx, ny = factors(total_samples)
+    tile_width = images.shape[-1] + 6  # + 6 pixels for the border
+    tile_height = images.shape[-2] + 6
+    full_width = tile_width * nx
+    full_height = tile_height * ny
+
+    # Assign to grid
+    grid = rasterfairy.transformPointCloud2D(tsne, target=(nx, ny))
+    grid_image = Image.new('RGB', (full_width, full_height))
+
+    # Create image
+    for img, label, grid_pos in zip(images, labels, grid[0]):
+        idx_x, idx_y = grid_pos
+        x, y = tile_width * idx_x, tile_height * idx_y
+
+        # Add color borders to images for class identification
+        tile = transforms.ToPILImage()(img)
+        tile = ImageOps.expand(tile, border=3, fill=colors[int(label.item())])
+
+        grid_image.paste(tile, (int(x), int(y)))
+
+    plt.figure(figsize=(16, 12))
+    imshow(grid_image)
+
+    legend_elements = [Patch(facecolor="w", edgecolor=palette[i],
+                             label=f'Class {i}') for i in range(nclasses)]
+    plt.legend(
+        handles=legend_elements, loc='center left', bbox_to_anchor=(1, 0.5))
+
+    plt.title(args.title)
+    plt.savefig(args.filename+".png")
+
+    print("Done.")
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(
+        description="t-SNE visualization of generated samples")
+
+    parser.add_argument(
+        '-p', '--path', required=True, type=str, dest='path',
+        help=('Path to the directory of the generated images. ' +
+              'The directory should have the following format: ' +
+              'dir/{class-0, class-1, ...}/image_X.png)'))
+
+    parser.add_argument('-f', '--filename', required=True,
+                        type=str, dest='filename',
+                        help='Filename for the .png file.')
+
+    parser.add_argument('-n', '--nsamples', required=True,
+                        type=int, dest='nsamples',
+                        help='Number of samples to use from each class.')
+
+    parser.add_argument('-t', '--title', default='t-SNE visualization',
+                        type=str, dest='title',
+                        help='Title for the image.')
+
+    parser.add_argument('-b', '--batch_size', default=32,
+                        type=int, dest='batch_size',
+                        help='Number of samples per batch.')
+
+    args = parser.parse_args()
+
+    visualize(args)