Problem Set 1 (61 points)¶

Important information¶

  1. We provide signatures of the functions that you have to implement. Make sure you follow the defined signatures; otherwise your coding solutions will not be graded.

  2. Please submit a single Jupyter Notebook file where only Python and Markdown/$\LaTeX$ are used. Hand-written solutions inserted as photos or in any other way are prohibited and will not be graded. If you have any questions about using Markdown, ask them!

  3. All works will be checked for plagiarism. The score will be divided by the number of similar works.

Problem 1 (18 pts)¶

Problem 1.0 (Matrix norms) (8 pts)¶

  1. For any norm $\|\cdot\|$ on the finite-dimensional space $\mathbb{C}^{N}$ we define the dual norm $\|x\|' = \sup\left\{\left|y^{\star} x\right|:\left\|y\right\|=1\right\}$, where ${\cdot}^{\star}$ denotes the conjugate-transpose vector. (A numerical sanity-check sketch is given after this list.)
  • (2 pts). Prove that $\|\cdot\|'$ is a norm.

  • (2 pts). Find the dual norms of the Chebyshev norm $\left\|x\right\|_{\infty} = \max\limits_{i=1,\dots, N}|x_{i}|$ and the $l_1$ norm $\left\|x\right\|_1 = \sum\limits_{i=1}^{N}|x_{i}|$.

  • (2 pts). Find the dual norm of the $l_p$ norm $\left\|x\right\|_{p} = \left(\sum\limits_{i=1}^{N}|x_{i}|^{p}\right)^{1/p}$.

  • (2 pts). Find the dual norm of the weighted norm $\left\|x\right\|_{A} = \left(x^T A x\right)^{1/2}$ with a positive-definite matrix $A$ and $x\in\mathbb{R}^{N}$.
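
If you want to sanity-check your analytic answers numerically, a crude Monte-Carlo lower bound on the dual norm can be obtained by sampling; the helper dual_norm_estimate below is a sketch of our own (restricted to real vectors), not part of the required solution.

In [ ]:
import numpy as np

rng = np.random.default_rng(0)

def dual_norm_estimate(x, norm, n_samples=20_000):
    # Monte-Carlo lower bound on ||x||' = sup{ |y^T x| : ||y|| = 1 }:
    # sample random directions, normalize them in the given norm, take the max
    Y = rng.standard_normal((n_samples, x.size))
    Y /= np.array([norm(y) for y in Y])[:, None]
    return np.abs(Y @ x).max()

x = rng.standard_normal(4)
# estimate the dual of the Chebyshev norm and compare with your closed form
print(dual_norm_estimate(x, lambda y: np.abs(y).max()))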

Problem 1.1 (Matrix norms) (10 pts)¶

  1. Let $U \in \mathbb{R}^{n \times r}$ be an $n \times r$ matrix with orthonormal columns, $U^{\top} U = I_r$. Let $V$ be an $m \times r$ matrix.
  • (2 pts). Propose an algorithm for the computation of $\Vert A \Vert^2_F$, where $A = U V^{\top}$, and estimate its complexity with respect to $n, m, r$. How can orthogonalization be used?

  • (3 pts). Consider the matrix $B = A \circ A$, where $\circ$ is the elementwise product of matrices (i.e., the elements of the matrix $B$ are squares of the elements of the matrix $A$). What is the maximal possible rank of the matrix $B$?

  • (5 pts). Propose an algorithm for the computation of $\Vert B \Vert^2_F$ and estimate its complexity with respect to $n, m, r$.

Problem 1.2 (Unitary and orthogonal matrices) (4 pts)¶

  • (2 pts). Let $O\in\mathbb{R}^{n\times n}$ be an orthogonal matrix. Characterise explicitly all orthogonal matrices that are positive definite. You may start with $n=2$.

  • (2 pts). Show that any unitary matrix from $\mathbb{C}^{n\times n}$ can be represented as a product of at most $n$ Householder reflectors. (A warm-up sketch of a single reflector follows below.)
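
As a numerical warm-up for this point, here is a small sketch (our own, not required) of a single complex Householder reflector, the building block of such a factorization; it checks that the reflector is unitary and zeroes all but the first entry of a vector.

In [ ]:
import numpy as np

def householder_reflector(x):
    # H = I - 2 v v^* / (v^* v) is Hermitian and unitary;
    # v = x - alpha e_1 with alpha = -exp(i arg x_1) ||x||_2 avoids cancellation
    v = x.astype(complex)
    alpha = -np.exp(1j * np.angle(v[0])) * np.linalg.norm(v)
    v[0] -= alpha
    return np.eye(len(x)) - 2 * np.outer(v, v.conj()) / (v.conj() @ v)

rng = np.random.default_rng(0)
x = rng.standard_normal(4) + 1j * rng.standard_normal(4)
H = householder_reflector(x)
print(np.allclose(H.conj().T @ H, np.eye(4)))  # unitary
print(np.round(np.abs(H @ x), 8))              # only the first entry is nonzero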

Problem 2 (15 pts)¶

  1. We define the approximate $\epsilon$-rank of a matrix $A$ as $\text{rank}_{\epsilon}A = \min \left\{\text{rank}(X): \left\|A-X\right\|_{\max}\leq \epsilon\right\}$.
  • (6 pts). Let $f(x, y)$, $x, y\in[0, 1]$, be an analytic function with $\left|\partial_y^{(k)}f(x, 0)\right|\leq M$ for all $k$. Show that the approximate rank of the matrix $A_{ij} = f(x_i, y_j)$, where $x_{i},\,i=1,\dots,p$, and $y_{j},\,j=1,\dots,q$, are arbitrary points in $[0, 1]$, is bounded independently of $p$, $q$, and the choice of points.

  • (6 pts). Extend the result from the previous point to $x, y \in \mathbb{R}^{N}$. Observe how the bound depends on $N$.

  • (3 pts). Demonstrate your bounds from the two previous points numerically on the following functions (a minimal numerical sketch is given after this list):

    • (1 pt). $\cos(xy)$ and $\exp(-(x-y)^2)$, plus a few of your choice, for $N=1$;
    • (1 pt). the RBF kernel for different $N$;
    • (1 pt). the Exp-Sine-Squared kernel for different $N$.
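
A possible starting point for the numerical demonstration, as referenced above. This is only a sketch: it assumes that counting singular values above $\epsilon$ upper-bounds $\text{rank}_{\epsilon}$ (since $\|A - A_k\|_{\max} \leq \|A - A_k\|_2 = \sigma_{k+1}$), and eps_rank is our own helper name, not part of the assignment.

In [ ]:
import numpy as np

def eps_rank(A, eps):
    # ||A - A_k||_max <= ||A - A_k||_2 = sigma_{k+1}, so the number of
    # singular values above eps upper-bounds rank_eps (a proxy, not exact)
    s = np.linalg.svd(A, compute_uv=False)
    return int((s > eps).sum())

rng = np.random.default_rng(0)
for p in (50, 100, 200):
    x, y = rng.uniform(0, 1, p), rng.uniform(0, 1, p)
    A = np.cos(np.outer(x, y))
    print(p, eps_rank(A, 1e-8))  # the bound should not grow with p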

Problem 3 (Molecules) (16 pts)¶

In [ ]:
import matplotlib.pyplot as plt
import pandas as pd

We have in our possession a database of molecules. Each molecule has five atoms A, B, C, D, E located in the same $(x, y)$ plane.

The coordinates of the molecules were collected by an automatic system that processed "pictures" from an electron microscope. As a result, some of the samples differ by an unknown rotation in $2D$ space. Your task is to normalize this database and find the distinct molecules.

In [ ]:
data = pd.read_csv("https://raw.githubusercontent.com/oseledets/nla2022/main/hw1/molecules.csv", index_col=0)
data.head()
Out[ ]:
A_x A_y B_x B_y C_x C_y D_x D_y E_x E_y
sample
0 0.0 0.0 -0.568099 -0.822960 0.411480 -0.284050 -0.983627 -0.180214 -0.180214 0.983627
1 0.0 0.0 -0.816462 0.577399 0.288700 0.408231 -0.169043 0.985609 0.169043 -0.985609
2 0.0 0.0 -0.999628 -0.027283 0.013642 -0.499814 -0.726136 0.687551 0.687551 0.726136
3 0.0 0.0 0.946140 0.323758 -0.161879 0.473070 -0.897953 0.440091 -0.440091 -0.897953
4 0.0 0.0 -0.901767 0.432222 -0.216111 -0.450884 0.332018 -0.943273 0.943273 0.332018
In [ ]:
molecules = data.to_numpy().reshape(len(data), 5, 2)
molecules.shape
Out[ ]:
(500, 5, 2)
In [ ]:
def draw_molecule(ax, molecule):
    ax.scatter(*molecule.T, color="black", s=50)
    for i in range(1, molecule.shape[0]):
        ax.plot(*molecule[[0, i], :].T, color="black")
    ax.axis("off")
    ax.axis("equal")
In [ ]:
k = 5
fig, ax = plt.subplots(k, k, figsize=(2*k, 2*k))
ax = ax.reshape(-1,)
for i in range(k**2):
    draw_molecule(ax[i], molecules[i])

What you should do:¶

  • (2 pts). Prove that orthogonal transformations preserve $l_2$ norm, i.e., $\left\|x\right\|_2 = \left\|Ux\right\|_2$, where $U$ is an orthogonal matrix.
In [ ]:
#your solution
  • (4 pts). Use the result from the previous point to construct an algorithm that distinguishes different molecules. Implement it and run it on the database. Produce a list of distinct molecules and visualise them.
In [ ]:
#your solution
  • (7 pts). Learn about the Kabsch algorithm. Implement it and run it on the database. Produce a list of distinct molecules and visualise them. (A reference sketch of the rotation-fitting step is given after the solution cell below.)
In [ ]:
#your solution
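For reference, the rotation-fitting core of the textbook Kabsch algorithm looks roughly as follows. This is only a sketch for centered 2D point sets; you still have to wire it into the matching and deduplication pipeline yourself.

In [ ]:
import numpy as np

def kabsch_rotation(P, Q):
    # optimal proper rotation R (det R = +1) minimizing sum_i ||R p_i - q_i||^2
    # for centered point sets P, Q of shape (n_points, dim)
    U, S, Vt = np.linalg.svd(P.T @ Q)       # SVD of the cross-covariance matrix
    d = np.sign(np.linalg.det(Vt.T @ U.T))  # fix a possible reflection
    D = np.diag([1.0] * (len(S) - 1) + [d])
    return Vt.T @ D @ U.T

# toy check: recover a known 2D rotation
theta = 0.7
R_true = np.array([[np.cos(theta), -np.sin(theta)],
                   [np.sin(theta),  np.cos(theta)]])
P = np.random.default_rng(0).standard_normal((5, 2))
print(np.allclose(kabsch_rotation(P, P @ R_true.T), R_true))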
  • (3 pts). Compare the results of the algorithms from the two previous points. Explain the difference.
In [ ]:
#your solution

Problem 4 (Disentangled representation) (12 pts)¶

Brief intro¶

The main component of a GAN is the generator network. The generator is a model that takes a random vector as input and produces an image. In this task, we will work with an already pre-trained generator $G$. Here are a few things you need to know about this model:

1.   Model input: a batch of random vectors $z\sim N(0,1)$ with normally distributed entries, of size (Batch_Size, 100). Here, Batch_Size is the number of images we want to generate.
2.   Model output: $\mathrm{images} = G(z)$, a batch of images of size (Batch_Size, 3, 64, 64). Here 3 is the number of image channels (3 for RGB images), and 64, 64 are the width and height.
3.   Model structure: the generator is a set of sequentially applied functions, where each function's input is the output of the previous one. In other words, $G(z) = f_N(f_{N-1}(\dots f_1(f_0(z))))$, where $N$ is the number of functions in the generator.

Disentanglement¶

A nice property of GANs is that the generator input space has a set of meaningful directions: moving the input vector along these directions produces interpretable changes in the image. For example, we can change the pose, age, or expression, or even add eyeglasses. You can read more about it in this resource. The main question is how to find such good directions. This problem is called disentanglement.

Problem description¶

We are going to find meaningful directions using the SVD applied to the Jacobian matrix of some hidden output with respect to the model input. The $i$-th hidden output of the generator model is defined by the formula $G_{i}(z) = f_i(f_{i-1}(\dots f_1(f_0(z))))$, where $i < N$. The task can be split into four main parts (a toy rehearsal of the Jacobian + SVD pattern is sketched after the list):

1. (4 pts)   Write the function Get_Hidden_Output, which reproduces the formula $G_{i}(z) = f_i(f_{i-1}(\dots f_1(f_0(z))))$.

2. (3 pts)   Calculate the Jacobian matrix $J$ of the generator $G$ for several values of $i$. For each of them:

   • calculate the Jacobian matrix with respect to $z$: $\frac{\partial G_i(z)}{\partial z}$;
   • reshape the Jacobian matrix to have size (Batch_Size * Hidden_Output_Size, 100).

3. (3 pts)  Apply the SVD ($J = U S V^{\top}$) to the Jacobian matrix from the previous step.

4. (2 pts)  Take several directions from the matrix $V$ (particular columns) and run the visualization code (already written for you). Leave a comment on what you got (how the found directions affect the image).
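
Before attacking the generator itself, it may help to rehearse the jacrev/vmap + SVD pattern on a toy function, as mentioned above; the model toy below is a stand-in of our own and not part of the assignment.

In [ ]:
import torch
from functorch import vmap, jacrev

# toy stand-in: maps a 10-dim latent vector to a 6-dim "hidden output"
W = torch.randn(6, 10)
def toy(z):                    # z has shape (10,)
    return torch.tanh(W @ z)

z_batch = torch.randn(20, 10)      # batch of 20 latent vectors
J = vmap(jacrev(toy))(z_batch)     # per-sample Jacobians, shape (20, 6, 10)
J = J.reshape(-1, 10)              # analogous to (Batch_Size * Hidden_Output_Size, 100)
U, S, Vh = torch.linalg.svd(J, full_matrices=False)
print(J.shape, S[:3])              # rows of Vh are candidate latent directions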

Attention!!!

1.  Please run the code on Google Colab to satisfy the package requirements.
2.  The Jacobian matrix computation may take more than 20 minutes!
3.  Use a GPU runtime to accelerate the computations.

Prerequisites¶

In [ ]:
!pip install functorch
In [ ]:
import torch
from torch import nn
import requests
import matplotlib.pyplot as plt
import numpy as np
from torchvision import utils as vutils
from torchvision import transforms
from tqdm import tqdm
from google.colab import files
from functorch import vmap, jacfwd, jacrev
from functorch.experimental import replace_all_batch_norm_modules_
In [ ]:
device = "cuda:0" if torch.cuda.is_available() else "cpu"
#   size of feature maps in the generator
ngf = 64

# Number of channels in the training images. For color images this is 3
nc = 3

# Size of z latent vector (i.e. size of generator input)
nz = 100

print(f"Device: {device}, latent size {nz}, generator hidden dim {ngf}, number of image channels {nc}")
In [ ]:
def download_file_from_google_drive(id, destination):
    URL = "https://docs.google.com/uc?export=download"

    session = requests.Session()

    response = session.get(URL, params = { 'id' : id }, stream = True)
    token = get_confirm_token(response)

    if token:
        params = { 'id' : id, 'confirm' : token }
        response = session.get(URL, params = params, stream = True)

    save_response_content(response, destination)    

def get_confirm_token(response):
    for key, value in response.cookies.items():
        if key.startswith('download_warning'):
            return value

    return None

def save_response_content(response, destination):
    CHUNK_SIZE = 32768

    with open(destination, "wb") as f:
        for chunk in response.iter_content(CHUNK_SIZE):
            if chunk: # filter out keep-alive new chunks
                f.write(chunk)
In [ ]:
class Generator(nn.Module):
    def __init__(self, ngpu):
        super(Generator, self).__init__()
        self.ngpu = ngpu
        self.main = nn.Sequential(
            # input is Z, going into a convolution
            nn.ConvTranspose2d( nz, ngf * 8, 4, 1, 0, bias=False),
            nn.BatchNorm2d(ngf * 8),
            nn.ReLU(True),
            # state size. (ngf*8) x 4 x 4
            nn.ConvTranspose2d(ngf * 8, ngf * 4, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ngf * 4),
            nn.ReLU(True),
            # state size. (ngf*4) x 8 x 8
            nn.ConvTranspose2d( ngf * 4, ngf * 2, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ngf * 2),
            nn.ReLU(True),
            # state size. (ngf*2) x 16 x 16
            nn.ConvTranspose2d( ngf * 2, ngf, 4, 2, 1, bias=False),
            nn.BatchNorm2d(ngf),
            nn.ReLU(True),
            # state size. (ngf) x 32 x 32
            nn.ConvTranspose2d( ngf, nc, 4, 2, 1, bias=False),
            nn.Tanh()
            # state size. (nc) x 64 x 64
        )
    def get_function_output(self, inp, index=0):
        if index == 0:
            inp = inp[:,:,None,None]
        return self.main[index](inp)

    def get_number_of_layers(self):
        return len(self.main)

    def forward(self, input):
        return self.main(input[:,:,None,None])
In [ ]:
file_id = "1hIh2-8KjcUku1Dl-mLYqEObbODrCW_Fp"
destination = './G_checkpoint.pt'
download_file_from_google_drive(file_id, destination)
G = Generator(1).to(device)
G.load_state_dict(torch.load('./G_checkpoint.pt', map_location="cpu"))
replace_all_batch_norm_modules_(G)
In [ ]:
def sample_batch(batch_size):
  return torch.randn((batch_size,nz),device=device)
In [ ]:
def ToPILImage(tensor):
  return transforms.ToPILImage()(tensor)
In [ ]:
def ConvertTensorsToOne(tensor, nrow=None):
  if nrow is None:
    nrow = int(tensor.size(0) ** 0.5)
  return vutils.make_grid(tensor, padding=2, normalize=True, nrow=nrow).cpu()

Generator network visualization¶

In [ ]:
# the generator model consists of 14 functions, numbered from 0 to 13

G
Out[ ]:
Generator(
  (main): Sequential(
    (0): ConvTranspose2d(100, 512, kernel_size=(4, 4), stride=(1, 1), bias=False)
    (1): BatchNorm2d(512, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU(inplace=True)
    (3): ConvTranspose2d(512, 256, kernel_size=(4, 4), stride=(2, 2), padding=(1, 1), bias=False)
    (4): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (5): ReLU(inplace=True)
    (6): ConvTranspose2d(256, 128, kernel_size=(4, 4), stride=(2, 2), padding=(1, 1), bias=False)
    (7): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (8): ReLU(inplace=True)
    (9): ConvTranspose2d(128, 64, kernel_size=(4, 4), stride=(2, 2), padding=(1, 1), bias=False)
    (10): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (11): ReLU(inplace=True)
    (12): ConvTranspose2d(64, 3, kernel_size=(4, 4), stride=(2, 2), padding=(1, 1), bias=False)
    (13): Tanh()
  )
)
In [ ]:
# sample 64 random vectors to produce 64 images

z = sample_batch(64)

z.shape
Out[ ]:
torch.Size([64, 100])
In [ ]:
# producing images

out = G(z)

out.shape
Out[ ]:
torch.Size([64, 3, 64, 64])
In [ ]:
# generate the hidden output for a given input (remember that functions are applied sequentially: the input should be the output of the previous function)
# index defines which function's output will be returned
# for the function with index 0 the input is the model input "z"

hidden_output = G.get_function_output(z,index=0)

hidden_output.shape
Out[ ]:
torch.Size([64, 512, 4, 4])
In [ ]:
# plotting the images by combining them into one, with 8 images in each row (nrow=8)

plt.figure(figsize=(8,8))
plt.axis("off")
plt.title("Generator output")
plt.imshow(ToPILImage(ConvertTensorsToOne(out, nrow=8)))
Out[ ]:
<matplotlib.image.AxesImage at 0x7fb436120690>

Perform experiments¶

Define the function that returns the output of any generator function for a given input z and a generator function index (4 pts)

In [ ]:
def Get_Hidden_Output(z,index):
  # your solution
  out = # your solution
  return out

Define the function that calculates the Jacobian matrix for a given input z and a generator function index (use the function which you implemented earlier) (3 pts)

In [ ]:
def Calc_Gradient(z, index):
  grads = # your solution
  return grads
In [ ]:
index = # your solution
z = sample_batch(20)
grads = Calc_Gradient(z,index)

Calculate the SVD and visualize the singular values for several generator function indices (2-3 indices are enough). Based on the singular value plots, decide which generator function is most useful for the disentangled representation search and why; leave a comment. (3 pts)

In [ ]:
U, S, V = # your solution
# your solution

Choose some directions from the matrix V (some columns) corresponding to the chosen generator function index (based on the previous step). Run the visualization code. Which image attributes do the chosen directions affect? (2 pts)

In [ ]:
def make_edit(input, dirs):
  # original images for the batch
  output = G(input)
  # shift every latent vector along every direction (with step size 3)
  input_shift = input[:,None,:] + dirs[None,:,:]*3
  # decode the shifted latents and restore the (batch, n_dirs, 3, 64, 64) layout
  output_shift = G(input_shift.reshape(-1,nz)).reshape(input.size(0),-1,3,64,64)
  # interleave each original image with its edited versions
  return torch.cat([output[:,None],output_shift],dim=1).reshape(-1,3,64,64)
In [ ]:
input = sample_batch(4)
dirs = # your solution, number of directions should be the first dimension
In [ ]:
out = make_edit(input, dirs)
plt.figure(figsize=(16,16))
plt.axis("off")
plt.imshow(ToPILImage(ConvertTensorsToOne(out, nrow=(dirs.size(0)+1))))
Out[ ]:
<matplotlib.image.AxesImage at 0x7fb434c098d0>