In [ ]:
# Initialize Otter
import otter
grader = otter.Notebook("model_assignment_PCA.ipynb")

Dimensionality Reduction Adventures with Animal Faces¶

Audience and context¶

This assignment is part of the Unsupervised Machine Learning course in our Master of Data Science program (MDS) at the University of British Columbia. MDS is an intensive 10-month professional program designed for a diverse audience, including learners transitioning into data science. The program intentionally has minimal prerequisites: one course in programming, one in statistics and probability, and one in either introductory calculus or linear algebra.

The curriculum follows a block structure, where students complete short 1-credit modules in each block. This course takes place in Block 5, at a point when students are already familiar with deep learning and Convolutional Neural Networks. You can find the courses offered in each block, along with their descriptions, here.

We maintain our lecture notes and teaching materials for the course on GitHub Enterprise. While those internal materials are not publicly accessible, here are publicly available versions of the notes from the 2024–25 offering:

  • PCA introduction
  • More PCA
  • PCA class demo



Learning objectives¶

By completing this assignment, I will be able to:

  • Explain PCA notation by identifying the roles and dimensions of the matrices $X$, $W$, $Z$, and $\hat{X}$ in dimensionality reduction.
  • Analyze reconstruction error for both typical examples and outliers, reasoning about information retention and loss.
  • Implement PCA using Singular Value Decomposition (SVD), including methods for transformation and reconstruction, and validate results against scikit-learn.
  • Apply PCA to real data (Animal Faces), select an appropriate number of components, and interpret the meaning of the learned components.
  • (Stretch goal) Develop and train a convolutional autoencoder on the same dataset, experiment with architectural and training choices, and compare its performance with PCA.



Imports¶

In [ ]:
import pickle
from hashlib import sha1

%matplotlib inline
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from PIL import Image
from sklearn import datasets
from sklearn.decomposition import PCA
from sklearn.preprocessing import StandardScaler
from utils import *





Instructions¶

rubric={mechanics}

You will earn points for following these instructions and successfully submitting your work on Gradescope.

Before you start¶

  • Read the Use of Generative AI Policy.

  • Review the General Lab Instructions.

  • Check the MDS Rubrics for grading criteria.

Before submitting¶

  • Run all cells (▶▶ button) to ensure the notebook executes cleanly from top to bottom.

    • Execution counts must start at 1 and be sequential.

    • Notebooks with missing outputs or errors may lose marks.

  • Include a clickable link to your GitHub repository below this cell.

  • Make at least 3 commits to your GitHub repository and ensure it's up to date. If Gradescope becomes inaccessible, we'll grade the most recent GitHub version submitted before the deadline.

  • Do not upload or push data files used in this lab to GitHub or Gradescope. (A .gitignore is provided to prevent this.)

Submitting on Gradescope¶

  • Upload only your .ipynb file (with outputs shown) and any required output files. Do not submit extra files.

  • If needed, refer to the Gradescope Student Guide.

  • If your notebook is too large to render, also upload a Web PDF or HTML version.

    • You can create one using File $\rightarrow$ Save and Export Notebook As.

    • If you get an error when creating a PDF, try running the following commands in your lab directory:

      conda install -c conda-forge nbconvert-playwright
      jupyter nbconvert --to webpdf lab1.ipynb
      
    • Ensure all outputs are visible in your PDF or HTML file; TAs cannot grade your work if outputs are missing.

Points: 2

YOUR REPO LINK GOES HERE





Exercise 1: Warm-up¶


This lab is about getting familiar with one of the most widely used dimensionality-reduction techniques: Principal Component Analysis (PCA). PCA has applications across many domains, including genetics, neuroscience, image processing, and computer vision.

Although PCA is now viewed as a standard tool in data science, its development spans more than a century and reflects a rich blend of statistics, psychology, and early computational thinking. If you're curious about the historical journey behind PCA and how the modern formulation emerged, you can read more on the Principal component analysis Wikipedia page.

In this warm-up exercise, we'll begin by getting familiar with the core terminology. In later exercises, you'll explore a classic computer-vision application of PCA known as Eigenfaces.

1.1 Dimensionality reduction notation¶

rubric={accuracy}

Your tasks:

Suppose you apply dimensionality reduction on a data matrix $X_{n \times d}$ using a dimensionality reduction technique such as Principal Component Analysis (PCA), where

  • $n \rightarrow $ number of examples
  • $d \rightarrow $ number of features
  • $k \rightarrow $ number of components

and you get the following matrices:

  • $W$: the matrix that contains the $k$ principal components,
  • $Z$: the lower-dimensional representation of the data after projection,
  • $\hat{X}$: the reconstruction of the original data from the lower-dimensional representation.

Based on this setup, what are the dimensions of $W$, $Z$, and $\hat{X}$? Please select from the options below.

  • (A) $n \times k$
  • (B) $n \times d$
  • (C) $k \times d$

Solution_1_1

Points: 2

In [ ]:
# Assign the variables to either "A", "B", or "C"
W_dim = ...
Z_dim = ...
X_hat_dim = ...
In [ ]:
grader.check("q1.1")



1.2 PCA by hand¶

Suppose you train the standard PCA algorithm on an already centered data matrix X (not shown) and you get the Z and W shown below.

In [ ]:
Z = np.array([[10, 10], [5, 2], [4, 3], [4, 3]])
W = np.array([[0.5, 0.5, -0.5, -0.5], [0.7, 0.1, 0.7, 0.1]])
In [ ]:
Z
In [ ]:
W

1.2.1¶

rubric={accuracy}

Your tasks:

  1. How many rows and columns would there be in the data matrix X?

Solution_1_2_1

Points: 1

In [ ]:
X_rows = ...
X_cols = ...

print("Number of rows:", X_rows)
print("Number of columns:", X_cols)
In [ ]:
grader.check("q1.2.1")



1.2.2¶

rubric={accuracy}

Your tasks:

Fill in the blanks:

  • In this toy example, we are reducing dimensionality from $d$ dimensions to $p$ dimensions.

Solution_1_2_2

Points: 1

In [ ]:
# original dimensions
d = ...

# reduced_dimensions
p = ...
In [ ]:
grader.check("q1.2.2")



1.2.3¶

rubric={accuracy}

Find the low-dimensional representation of the already centered X_new below.

In [ ]:
X_new = np.array([[1, 1, 1, 1], [1, 0, 1, 1]])
In [ ]:
X_new

Solution_1_2_3

Points: 1

In [ ]:
Z_new = ...
In [ ]:
grader.check("q1.2.3")



1.2.4¶

rubric={reasoning}

In our toy example, the third and fourth rows of the transformed matrix Z (the lower-dimensional representation) are identical, as are the corresponding rows in the original matrix X.

Does this imply that, in general, if two arbitrary data points in a dataset have identical lower-dimensional representations after applying PCA, their original high-dimensional representations must also be identical? Briefly explain your reasoning.

In [ ]:
Z

Solution_1_2_4

Points: 2

Type your answer here, replacing this text.



1.3 Reconstruction error¶

Let's get an intuition for reconstruction error on a toy dataset.

The code below creates a toy dataset with a few outliers. The function get_recon_error_df from utils.py calculates normalized reconstruction errors between the original and reconstructed data points. Run the code and answer the following questions.
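The exact implementation of get_recon_error_df lives in utils.py and is not shown here. Purely as a hedged sketch of the idea, a normalized per-example reconstruction error might look something like the following; the actual utils.py version may normalize or format differently.

```python
import numpy as np
import pandas as pd

def recon_error_sketch(X, X_hat):
    """Per-example Euclidean reconstruction error, min-max normalized.

    This is only a guess at what utils.py's get_recon_error_df computes;
    the real implementation may differ.
    """
    err = np.linalg.norm(X - X_hat, axis=1)            # distance per example
    err = (err - err.min()) / (err.max() - err.min())  # scale to [0, 1]
    return pd.DataFrame({"recon_error": err})

rng = np.random.default_rng(0)
X_demo = rng.standard_normal((5, 2))
X_hat_demo = X_demo + rng.standard_normal((5, 2)) * 0.1  # pretend reconstruction
recon_demo = recon_error_sketch(X_demo, X_hat_demo)
```

Points with normalized errors close to 1 are the ones a model reconstructs worst, which is the intuition the questions below build on.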

In [ ]:
np.random.seed(42)
outliers = np.array([[4, -3], [2.8, -3], [-3, 3]])
x1 = np.random.randn(100)
x2 = x1 + np.random.randn(100) / 2
X = np.stack([x1, x2]).T
X_noise = np.vstack([X, outliers])
X_noise_scaled = StandardScaler().fit_transform(X_noise)
plt.scatter(
    X_noise_scaled[:, 0], X_noise_scaled[:, 1], edgecolors="black", c="xkcd:azure"
);



1.3.1¶

rubric={accuracy}

Your tasks:

  1. Fit PCA with n_components=1 on X_noise_scaled with random_state=123.
  2. Obtain reconstructions X_hat.
  3. Calculate the reconstruction error using the get_recon_error_df function from utils.py and store the returned dataframe in recon_df below.

Solution_1_3_1

Points: 2

In [ ]:
...
In [ ]:
recon_df = ...
recon_df
In [ ]:
grader.check("q1.3.1")



1.3.2¶

rubric={accuracy}

Your tasks:

  1. The last 3 rows (indices 100 to 102) in X_noise_scaled are outliers. Calculate the average reconstruction error for the outliers vs. the average reconstruction error for the other (non-outlier) data points.

Solution_1_3_2

Points: 2

In [ ]:
outliers_avg_recon_error = ...
non_outliers_avg_recon_error = ...
In [ ]:
outliers_avg_recon_error
In [ ]:
non_outliers_avg_recon_error
In [ ]:
grader.check("q1.3.2")
⚠️ Don't forget to git commit. Regular commits will help you track your progress!





Exercise 2: Implementing PCA using SVD¶


rubric={accuracy}

In this exercise, you'll implement your own version of PCA using SVD. The class MyPCA below implements the __init__ and fit methods.

Your tasks:

  1. Complete the get_components method of the class, which returns the learned components.
  2. Complete the transform method of the class, which returns the transformed Z for a given X. Before applying the transformation, center the data by subtracting the mean.
  3. Complete the reconstruct method of the class, which returns the reconstructed X_hat for a given transformed Z. Do not forget to add the mean back after reconstruction.
  4. Run your code and compare the results of your PCA and scikit-learn's PCA using the code below.

Solution_2

Points: 8

In [ ]:
class MyPCA:
    """
    Solves the PCA problem min_{Z,W} ||Z W - X||_F^2 using SVD.
    """

    def __init__(self, k):
        """
        Initializes the MyPCA instance with the specified number of components.

        Parameters
        ----------
        k : int
            The number of principal components to retain.
        """
        self.k = k

    def fit(self, X):
        """
        Computes the principal components from the dataset X using SVD.

        Parameters
        ----------
        X : np.ndarray
            The input dataset from which to compute principal components.

        Returns
        -------
        None
        """
        self.mean = np.mean(X, axis=0)
        X = X - self.mean  # Center the data
        U, S, Vt = np.linalg.svd(
            X
        )  # SVD to get singular values and principal components
        self.W = Vt[: self.k, :]  # store only first k components in self.W

    def get_components(self):
        """
        Returns the principal components obtained after fitting the model.

        Parameters
        ----------
        None

        Returns
        -------
        np.ndarray
            An array containing the top k principal components.
        """
        ### Solution_2_1
        ...

    def transform(self, X):
        """
        Transforms the dataset X into the principal component space (Z) and returns it.

        Parameters
        ----------
        X : np.ndarray
            The dataset to be transformed.

        Returns
        -------
        np.ndarray
            The dataset transformed into the principal component space.
        """
        ### Solution_2_2

        ...

    def reconstruct(self, Z):
        """
        Reconstructs the original dataset from the PCA transformed data Z.

        Parameters
        ----------
        Z : np.ndarray
            The PCA transformed data.

        Returns
        -------
        np.ndarray
            The reconstructed dataset, approximating the original dataset before transformation.
        """
        ### Solution_2_3

        ...
In [ ]:
from sklearn.datasets import make_blobs

X, y = make_blobs(n_samples=100, centers=3, n_features=20)  ## Generating toy data

for i in range(1, X.shape[1] + 1):
    pca = PCA(n_components=i)
    pca.fit(X)

    mypca = MyPCA(k=i)
    mypca.fit(X)

    assert np.allclose(
        np.abs(pca.components_), np.abs(mypca.get_components())
    ), "W values do not match"

    Z = pca.transform(X)
    Z_prime = mypca.transform(X)

    assert np.allclose(np.abs(Z), np.abs(Z_prime)), "Z values do not match"

    X_hat = pca.inverse_transform(Z)
    X_hat_prime = mypca.reconstruct(Z_prime)
    assert np.allclose(
        np.abs(X_hat), np.abs(X_hat_prime)
    ), "reconstructed X_hat values do not match"

    # Report success only after all checks for this number of components pass
    print("PCA implementation with {} components: OK".format(i))
In [ ]:
grader.check("q2")
⚠️ Don't forget to git commit. Regular commits will help you track your progress!





Exercise 3: Eigenfaces (PCA on animal faces)¶


Eigenfaces are a classic PCA-based approach to face recognition: when you run PCA on a set of aligned face photos (uniform size, lighting, and centering), each principal component reshaped as an image looks like a ghostly face: an eigenface. A new face can then be expressed as a weighted combination of these eigenfaces, giving a compact code for comparing or recognizing people in a lower-dimensional "face space" spanned by the eigenfaces, rather than in the high-dimensional pixel space of the aligned images. For the seminal demonstration, see the original Turk and Pentland paper from 1991.
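The pipeline described above can be sketched end to end on synthetic data. The random 8x8 arrays below are only a stand-in for aligned face photos (the lab itself uses the Animal Faces data), so the "eigenfaces" here are meaningless noise patterns; the point is just the shapes and the encode/decode roles.

```python
import numpy as np
from sklearn.decomposition import PCA

# Random 8x8 "images" standing in for aligned face photos.
rng = np.random.default_rng(42)
faces = rng.random((50, 8, 8))

X_faces = faces.reshape(len(faces), -1)          # flatten: (50, 64)
pca = PCA(n_components=5).fit(X_faces)

# Each principal component, reshaped to image size, is an "eigenface".
eigenfaces = pca.components_.reshape(-1, 8, 8)   # (5, 8, 8)

# Each face is encoded as a small vector of weights over the eigenfaces ...
codes = pca.transform(X_faces)                   # (50, 5)

# ... and approximately recovered as mean face + weighted sum of eigenfaces.
recon = pca.mean_ + codes @ pca.components_
```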

In the next few exercises, you'll apply dimensionality reduction to a curated subset of the Kaggle Animal Faces dataset.

Your tasks:

  • Download the compressed data from here

  • Uncompress animal_faces.pkl.zip file.

  • Put it into the data directory.

  • Unpickle animal_faces.pkl with the code below.

  • Display the first few images to verify the dataset loaded correctly.

In [ ]:
import pickle

animals = pickle.load(open("data/animal_faces.pkl", "rb"))
In [ ]:
import matplotlib as mpl

mpl.rcParams.update(mpl.rcParamsDefault)
plt.rcParams["image.cmap"] = "gray"
In [ ]:
animals.shape
In [ ]:
fig, axes = plt.subplots(2, 5, figsize=(12, 5), subplot_kw={"xticks": (), "yticks": ()})
for image, ax in zip(animals, axes.ravel()):
    ax.imshow(image)
plt.show()

Let's flatten the images.

In [ ]:
X_anims = animals.reshape(len(animals), -1)
X_anims.shape

The flattened representation of the data has shape $1500 \times 10,000$: each image is represented by $10,000$ features, one per pixel. Let's define an image_shape variable, which will come in handy later when we display images.

In [ ]:
image_shape = (100, 100)

Use this flattened representation (X_anims) in the rest of the lab.
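The flatten/unflatten round-trip this relies on can be sanity-checked on toy data (fake images here, not the animal faces):

```python
import numpy as np

image_shape = (100, 100)

# Two fake 100x100 "images".
imgs = np.arange(2 * 100 * 100).reshape(2, *image_shape)

flat = imgs.reshape(len(imgs), -1)         # (2, 10000): one row per image
restored = flat.reshape(-1, *image_shape)  # back to (2, 100, 100), losslessly
```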

3.1 Varying the number of components¶

rubric={accuracy,viz,reasoning}

Recall that PCA finds principal components such that the first principal component has the highest variance, the second component has the next highest variance, and so on. In this exercise, you will experiment with how varying the number of components changes reconstructions and the explained variance ratio.
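As a reminder of the mechanics (shown here on synthetic blobs, not the animal data), scikit-learn exposes the per-component variance fractions via explained_variance_ratio_, and their cumulative sum gives the proportion of total variance explained by the first $k$ components:

```python
import numpy as np
from sklearn.datasets import make_blobs
from sklearn.decomposition import PCA

X_toy, _ = make_blobs(n_samples=200, n_features=10, centers=3, random_state=0)
pca_toy = PCA(n_components=10, random_state=0).fit(X_toy)

ratios = pca_toy.explained_variance_ratio_  # one fraction per component, decreasing
cum_var = np.cumsum(ratios)                 # variance explained by the first k components
```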

Your tasks:

  1. Train scikit-learn's PCA model on X_anims using random_state=42 and n_components=1000. Then, plot the number of components (for $k = 1, \ldots, 1000$) against the proportion of total variance explained by the first $k$ components.
  2. Visualize and examine the reconstructions for 10, 50, 100, 200, 300, 500 components.
  3. Briefly discuss your observations.

Note that scikit-learn's PCA does the data centering for you. Do not scale the data in this exercise or the following ones.

Solution_3_1

Points: 8

Type your answer here, replacing this text.

In [ ]:
...
In [ ]:
...
In [ ]:
...



3.2 Discussion: outliers and off-distribution faces¶

rubric={reasoning}

For this animal-face PCA model, what would qualify as an outlier? Use the cartoon cat below (clearly off the training distribution) as a concrete example.

Your tasks:

  • Fit a PCA model with 300 components, then project and reconstruct the cartoon cat.

  • Describe visible artifacts (e.g., blurring toward an "average" animal face).

  • Based on this behaviour, what are the risks of using this PCA model as a preprocessing step in downstream tasks? When should you trust the projections, and when should you flag or reject inputs as off-distribution?

In [ ]:
cartoon_cat = 'img/cartoon_cat.png'
cartoon_img = plt.imread(cartoon_cat)
plt.imshow(cartoon_img)
plt.axis("off")
plt.show()

Solution_3_2

Points: 4

Type your answer here, replacing this text.

In [ ]:
...
⚠️ Don't forget to git commit. Regular commits will help you track your progress!





Exercise 4: Interpreting the components learned by PCA¶


PCA is a linear transformation that reduces dimensionality while preserving as much variance as possible. Because PCA learns meaningful patterns in the data, we can visualize and interpret its principal components.

In this exercise, you will analyze the components learned by PCA. The code below trains a PCA model on X_anims with n_components=300 and random_state=42, producing:

  • $Z$ (the transformed data in the lower-dimensional space),
  • $W$ (the principal components, describing the directions of maximum variance), and
  • $\hat{X}$ (the reconstructed data from these components).
In [ ]:
n_components = 300

pca = PCA(n_components=n_components, random_state=42)
pca.fit(X_anims)

Z = pca.transform(X_anims)
W = pca.components_
X_hat = pca.inverse_transform(Z)
In [ ]:
Z.shape
In [ ]:
W.shape
In [ ]:
X_hat.shape

You will be using these in the following exercises.



4.1 Visualizing strong component images¶

rubric={accuracy, reasoning}

The principal component matrix returned by PCA (the $W$ matrix) has shape (number of components) $\times$ (number of features). Since each component has one weight per pixel, you can reshape it into an image of size $100 \times 100$ for visualization.

Your tasks:

  1. Visualize the first 15 principal components by reshaping them into $100 \times 100$ images and displaying them in a grid with 3 rows and 5 columns.
  2. Identify at least four principal components where you observe clear semantic patterns or themes. For each selected component, use the plot_strong_comp_images function from utils.py to extract and display a few example images:
    • Where the component values are large positive values (positive_direction=True (default value)).
    • Where the component values are large negative values (positive_direction=False).
  3. Observe the extracted images and their corresponding components and identify and describe any possible semantic themes that these components seem to capture.

Feel free to use code from the lecture notes with appropriate attribution. The plot_strong_comp_images function is provided in utils.py; feel free to modify it if necessary.

Solution_4_1

Points: 6

Type your answer here, replacing this text.

In [ ]:
...
In [ ]:
...
In [ ]:
...



4.2 Visualization of first two dimensions¶

rubric={viz}

One of the use cases of PCA is visualization. High-dimensional data cannot be visualized directly. That said, since the first couple of PCA components usually capture a large share of the information in the data, we can plot the first two dimensions to get an intuition about patterns in the data.

Your tasks:

  1. Make a scatterplot of the first two dimensions in the transformed data $Z$.

Solution_4_2

Points: 2

In [ ]:
...



4.3 Image tiling¶

rubric={accuracy,quality,reasoning}

In this exercise you will attempt to interpret the first two dimensions of the transformed data. One way to interpret these dimensions is as follows:

  • Create an $m \times m$ grid which roughly spans the scatterplot region from the previous exercise. For example, if Z is your transformed data, the following will get you five points spanning the first dimension.
    np.linspace(np.min(Z[:, 0]), np.max(Z[:, 0]), 5)
    
  • Once you have representative points which span the first dimension, get the indices of the data points closest to these points.
  • Plot the images corresponding to these indices as a grid and observe whether you see any pattern as the first dimension increases (left to right of the grid) and as the second dimension increases (bottom to top of the grid).

Let's try this out with $m=5$, i.e., a $5 \times 5$ grid.

Your tasks:

  1. Make a $5 \times 5$ grid that roughly spans the scatterplot region from the previous exercise (but stays within it). For each point on that grid, select the animal face whose first two dimensions are closest to the grid point. Plot a $5 \times 5$ tiling of these animal faces, corresponding to the grid, using the img_tiling function below.
  2. What happens to the images as the first dimension increases (i.e., go from left to right of the grid)? What about the second dimension? Briefly discuss your observations and try to label your axes based on your interpretation.
In [ ]:
def img_tiling(animals, idx, size=10, image_shape=(100, 100)):
    """
    Plots a 5x5 grid of animal faces, arranged from bottom to top and left to right.

    Parameters:
    -----------
    animals : numpy.ndarray
        A collection of animal face images, where each image is represented as a flattened array.

    idx : numpy.ndarray
        A 5x5 matrix of indices, where each element corresponds to an index in `animals` representing
        the closest matching face for that grid position. The grid layout follows:
            - `idx[0, 0]` corresponds to bottom-left corner
            - `idx[0, 4]` corresponds to top-left corner
            - `idx[4, 0]` corresponds to bottom-right corner
            - `idx[4, 4]` corresponds to top-right corner

    size : int, optional (default=10)
        The figure size for the plotted grid.

    image_shape : tuple, optional (default=(100, 100))
        The expected shape of each image before plotting.

    Returns:
    --------
    None
        Displays the 5x5 grid of images.

    Notes:
    ------
    - Each selected face is reshaped to `image_shape` before being plotted.
    """
    idx = np.array(idx, dtype="int32")  # Make sure the indices are integers

    plt.figure(figsize=(size, size))  # Creating the image with the desired size

    tile_size = 5
    # Plotting the 5x5 tiling
    for i in range(tile_size):
        for j in range(tile_size):
            face = np.reshape(
                animals[idx[i, j]], (image_shape)
            )  # Obtain the closest face
            plt.imshow(
                face, extent=(i * 32, (i + 1) * 32, j * 32, (j + 1) * 32)
            )  # Plot the closest animal face
    plt.xlim((0, 160))
    plt.ylim((0, 160))
    plt.xticks([])
    plt.yticks([])

Solution_4_3

Points: 8

Type your answer here, replacing this text.

In [ ]:
...
⚠️ Don't forget to git commit. Regular commits will help you track your progress!





Exercise 6: Food for thought¶


As you know, each lab has a few challenging questions. These are usually low-risk questions and will contribute at most 5% of the lab grade. The main purpose is to challenge yourself, dig deeper into a particular area, and go beyond what we explicitly discussed in class. When you work on the lab, attempt all other questions before moving on to these challenging ones. If you are running out of time, please skip the challenging questions.

We will be stricter in marking these questions, and there might not be model answers. To get full points, your answers need to

  • be thorough, thoughtful, and well-written
  • provide convincing justification and appropriate evidence for the claims you make
  • impress the reader of your lab with your understanding of the material, your analytical and critical reasoning skills, and your ability to think on your own



(Challenging) 6.1 CNN Autoencoder on the animal faces dataset¶

rubric={reasoning}

As we briefly discussed in class, an autoencoder is a neural network that learns to compress input data into a lower-dimensional representation (the encoder) and then reconstruct the original input from that representation (the decoder). Like PCA, an autoencoder supports reconstruction from a compact code. In fact, if an autoencoder has only one hidden layer and no nonlinear activation functions, it becomes essentially equivalent to PCA.

However, because autoencoders allow much more architectural flexibility, they can learn richer representations than PCA. Unlike PCA's strictly linear subspace, autoencoders can capture nonlinear structure in the data. And when built with convolutional layers, they can take advantage of spatial patterns in images, making them effective for image reconstruction tasks.
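The earlier claim that a single-hidden-layer linear autoencoder is essentially PCA can be checked numerically: by the Eckart–Young theorem, PCA's rank-$k$ projection is the best any linear encode/decode pair can achieve in squared error. A minimal NumPy sketch (toy random data, not the animal faces):

```python
import numpy as np

rng = np.random.default_rng(0)
X = rng.standard_normal((100, 20))
Xc = X - X.mean(axis=0)              # center, as PCA does

k = 5
U, S, Vt = np.linalg.svd(Xc, full_matrices=False)
W = Vt[:k]                           # top-k principal components

# A linear "autoencoder": encode Z = Xc W^T, decode X_hat = Z W.
X_hat_pca = (Xc @ W.T) @ W

# The optimal rank-k approximation (truncated SVD) is the same thing.
X_hat_svd = U[:, :k] @ np.diag(S[:k]) @ Vt[:k]

# Any other rank-k linear bottleneck does at least as badly, e.g. a
# random orthonormal projection:
Q, _ = np.linalg.qr(rng.standard_normal((20, k)))
X_hat_rand = (Xc @ Q) @ Q.T

err_pca = np.linalg.norm(Xc - X_hat_pca)
err_rand = np.linalg.norm(Xc - X_hat_rand)
```

Nonlinear activations and convolutional layers are exactly what lets an autoencoder escape this linear optimum, which is the motivation for the CNN autoencoder below.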

In this exercise, you will implement a CNN autoencoder for the animal faces dataset and visualize your model's reconstructions.

The starter code resizes images to 64x64 and provides PyTorch trainloader and validloader.

Your tasks:

  • Build a CNN autoencoder for Animal Faces:
    • Define a CNNAutoencoder with an encoder and decoder.
    • Instantiate the model (use the correct in_channels).
    • Choose a suitable loss (e.g., MSE) and optimizer.
    • Write the training loop and train your model.
  • Visualize several original vs reconstructed images and evaluate reconstruction quality.
  • In 3–5 sentences, connect to PCA: compare the latent code to PCA components (similarities/differences; when one might outperform the other on images).
  • Propose two concrete improvements you didn't try but could potentially improve the reconstructions.
In [ ]:
import pickle
import numpy as np
import torch
from torch.utils.data import Dataset, DataLoader
from torchvision import transforms

resize_to = (64, 64)
# Load animal faces array: shape (N, H, W) or (N, H, W, C)
animals = pickle.load(open("data/animal_faces.pkl", "rb"))

if animals.ndim == 3:
    # Add a channel dimension (N, H, W) --> (N, H, W, 1) 
    animals = animals[:, :, :, None]
elif animals.ndim != 4:
    raise ValueError("Expected animals to be (N,H,W) or (N,H,W,C).")

N, H, W, C = animals.shape # C = 1 (grayscale) or 3 (RGB)

# Transform: to float [0,1] if needed, CHW tensor, and resize to 64x64
def _maybe_scale(x):
    if x.dtype == np.uint8:
        return (x / 255.0).astype(np.float32)
    return x.astype(np.float32)

# Numpy (H, W, C) --> Torch(C, H, W) float32
to_tensor = transforms.Lambda(lambda x: torch.from_numpy(x.transpose(2,0,1)).float())

# Resize to 64x64 for faster training and clean down/up-sampling steps
_resize = transforms.Resize(resize_to)


class AnimalFacesDataset(Dataset):
    def __init__(self, arr):
        self.arr = arr
    def __len__(self):
        return self.arr.shape[0]
    def __getitem__(self, idx):
        x = _maybe_scale(self.arr[idx])      # (H,W,C) in [0,1]
        x = to_tensor(x)                     # (C,H,W) float32
        x = _resize(x)                       # (C,64,64)
        return x

# Train/valid split

rng = np.random.default_rng(42)
perm = rng.permutation(N)
split = int(0.9 * N)
train_idx, valid_idx = perm[:split], perm[split:]

train_ds = AnimalFacesDataset(animals[train_idx])
valid_ds = AnimalFacesDataset(animals[valid_idx])

BATCH_SIZE = 64
trainloader = DataLoader(train_ds, batch_size=BATCH_SIZE, shuffle=True, drop_last=True)
validloader = DataLoader(valid_ds, batch_size=BATCH_SIZE, shuffle=False, drop_last=False)

in_channels = C  # 1 for grayscale, 3 for RGB
print(f"Inferred channels={in_channels}, original size=({H},{W}), resized to {resize_to}.")
In [ ]:
# Sample image
X = next(iter(trainloader))
plt.figure(figsize=(3, 3))
plt.axis("off")
plt.imshow(X[0, 0, :, :], cmap="gray")
plt.show()

Solution_6_1

Points: 2

In [ ]:
...
In [ ]:
...
In [ ]:
...
In [ ]:
...
⚠️ Don't forget to git commit. Regular commits will help you track your progress!





Before submitting your assignment, please ensure you have followed all the steps in the Instructions section at the top.

Submission checklist¶

  • Restart the kernel and run all cells (▶▶ button)
  • Make at least three commits to your GitHub repository.
  • The .ipynb file runs without errors and shows all outputs.
  • Only the .ipynb file and required output files are uploaded (no extra files).
  • If the .ipynb file is too large to render on Gradescope, upload a Web PDF and/or HTML version as well.
  • Include the link to your lab GitHub repository below the instructions.

Well done!! Have a wonderful weekend!

In [ ]:
from IPython.display import Image

Image("img/eva-happy-caturday.png")