Lab2: Deep Learning Basics and Learned Index¶

In Lab2, you will learn deep learning basics and use them to build an NN4Sys application, Learned Index. For the basics, we borrow heavily from the textbook Dive into Deep Learning (d2l), in particular S3.2. Object-Oriented Design for Implementation, which provides a nice "object-oriented" interface for organizing deep learning code, along with some useful utility functions. In the second part, you will train a learned index of your own.

Section 0: Getting Started¶

Environment preparation¶

  1. install conda or miniconda (see here)
  2. $ conda create -n cs7670 python=3 : create a conda environment called "cs7670"
  3. $ conda activate cs7670 : activate this environment
  4. $ pip install d2l==1.0.0a1 : install necessary packages from d2l
  5. $ pip install torch torchvision termcolor : install PyTorch and a color printing package
  6. $ conda install ipykernel : install IPython kernel

Lab2 preparation¶

  1. Click the GitHub Lab2 link on the GitHub homepage to create your Lab2 clone on GitHub.
  2. Open a Linux terminal.
  3. Clone Lab2 repo to your local machine:
    $ cd ~  
    $ git clone git@github.com:NEU-CS7670-labs/lab2-<Your-GitHub-Username>.git lab2

Note that the repo address git@github.com:... can be obtained by going to the GitHub repo page (your cloned lab2), clicking the green "Code" button, and then choosing "SSH".

  4. Check contents:
    $ cd ~/lab2; ls
    // you should see:
    FighterJet.mp4  Lab2.ipynb  data  utils.ipynb
  5. Start your lab2:
    $ cd ~/lab2
    $ conda activate cs7670  # if you haven't
    $ jupyter-notebook

This should open your default browser. Click the file named Lab2.ipynb.

A note about Jupyter notebooks: if you're not familiar with Jupyter notebooks, here is a quick tutorial. We will only use the basics, and you don't have to be an expert in this tool.

Section 1: Understanding DL training interfaces¶

This section is a revised version of Object-Oriented Design for Implementation from d2l.ai.

Below, you should start running the code snippets (click the "Run" button on the top toolbar, or press "Ctrl + Enter" by default).

In [ ]:
from termcolor import colored

def info(msg):
    assert isinstance(msg, str)
    print(colored(msg, "magenta", attrs=['bold']))

info("Active environment should be cs7670:")
! conda info | grep 'active env'
In [ ]:
import time
import random
import numpy as np
import torch
from torch import nn
from d2l import torch as d2l

Section 1.1: Utility functions¶

a) add function to class¶

We need a few utilities to simplify object-oriented programming in Jupyter notebooks. One of the challenges is that class definitions tend to be fairly long blocks of code. Notebook readability demands short code fragments, interspersed with explanations, a requirement incompatible with the style of programming common for Python libraries. The first utility function allows us to register functions as methods in a class after the class has been created. In fact, we can do so even after we’ve created instances of the class! It allows us to split the implementation of a class into multiple code blocks.

In [ ]:
def add_to_class(Class):
    """Register a function as a method of `Class` after the class has been created."""
    def wrapper(obj):
        setattr(Class, obj.__name__, obj)
    return wrapper
In [ ]:
class HelloWorld:
    def __init__(self):
        super().__init__()
        self.msg = "nothing"

# create an instance of HelloWorld
hello = HelloWorld()
info(f"an instance of class HelloWorld has a message hello.msg=``{hello.msg}''")

Next let's add one function to the above class HelloWorld.

In [ ]:
# add one function to class
@add_to_class(HelloWorld)
def update_msg(self, msg):
    self.msg = msg
    
# update the msg to "hello world"
hello.update_msg("hello world")

info(f"the same instance now has a message hello.msg=``{hello.msg}''")
In [ ]:
# Exercise: use "@add_to_class" helper to implement a function "print_msg" 
# that prints "self.msg" stored in the HelloWorld instance. 

# TODO: your code here


# print message
info('Expected to see "hello world"')
hello.print_msg()

b) HyperParameters¶

The second one is a utility class that saves all arguments in a class’s __init__ method as class attributes. This allows us to extend constructor call signatures implicitly without additional code.

In [ ]:
# The HyperParameters class saves all arguments in a class's
# `__init__` method as class attributes.

class HyperParameters:
    def save_hyperparameters(self, ignore=[]):
        # saves all arguments in a class's `__init__` method as class attributes.
        pass
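
The full implementation is provided by d2l, which we will use below. For intuition only, here is a minimal sketch (under the name HyperParametersSketch, which is not part of d2l) of how save_hyperparameters could be written with Python's inspect module:

import inspect

class HyperParametersSketch:
    def save_hyperparameters(self, ignore=[]):
        # look at the caller's frame, i.e., the `__init__` that invoked us
        frame = inspect.currentframe().f_back
        _, _, _, local_vars = inspect.getargvalues(frame)
        # keep every argument except `self`, private names, and anything in `ignore`
        self.hparams = {k: v for k, v in local_vars.items()
                        if k not in set(ignore + ['self']) and not k.startswith('_')}
        for k, v in self.hparams.items():
            setattr(self, k, v)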

To use it, we define our class that inherits from HyperParameters and calls save_hyperparameters in the __init__ method.

In [ ]:
# Call the fully implemented HyperParameters class saved in d2l
class A(d2l.HyperParameters):    
    def __init__(self, a, b):
        print('self.a =', self.a)

info("you should see an AttributeError.\n")
tmp = A(a=1, b=2)
In [ ]:
@add_to_class(A)
def __init__(self, a, b):
    self.save_hyperparameters(ignore=['b'])
    print('self.a =', self.a)
    print('There is no self.b =', not hasattr(self, 'b'))
    
info("you should see no errors now.")
tmp = A(a=1, b=2)

c) ProgressBoard: plotting figures¶

The last utility allows us to plot experiment progress interactively while it is going on. In deference to the much more powerful (and complex) TensorBoard we name it ProgressBoard.

The draw method plots a point (x, y) in the figure, with label specified in the legend. The optional every_n smooths the line by only showing 1/n of the points in the figure; their values are averaged from the n neighboring points in the original figure.

In [ ]:
board = d2l.ProgressBoard('this is name')
for x in np.arange(0, 10, 0.1):
    board.draw(x, np.sin(x), 'sin', every_n=2)
    board.draw(x, np.cos(x), 'cos', every_n=10)

Section 1.2: Module base class¶

The Module class (Lab2Module below) is the base class of all models we will implement. At a minimum we need to define three methods:

  • The __init__ method stores the learnable parameters,
  • the training_step method accepts a data batch to return the loss value,
  • the configure_optimizers method returns the optimization method, or a list of them, that is used to update the learnable parameters.
In [ ]:
class Lab2Module(nn.Module, d2l.HyperParameters):
    
    def __init__(self, plot_train_per_epoch=2, plot_valid_per_epoch=1):
        super().__init__()
        self.save_hyperparameters()
        self.board = d2l.ProgressBoard()
        
    def loss(self, y_hat, y):
        raise NotImplementedError

    def forward(self, X):
        assert hasattr(self, 'net'), 'Neural network is not defined'
        return self.net(X)

    def plot(self, key, value, train):
        """Plot a point in animation."""
        assert hasattr(self, 'trainer'), 'Trainer is not inited'
        self.board.xlabel = 'epoch'
        if train:
            x = self.trainer.train_batch_idx / \
                self.trainer.num_train_batches
            n = self.trainer.num_train_batches / \
                self.plot_train_per_epoch
        else:
            x = self.trainer.epoch + 1
            n = self.trainer.num_val_batches / \
                self.plot_valid_per_epoch
        self.board.draw(x, value.to(d2l.cpu()).detach().numpy(),
                        ('train_' if train else 'val_') + key,
                        every_n=int(n))

    def training_step(self, batch):
        l = self.loss(self(*batch[:-1]), batch[-1])
        self.plot('loss', l, train=True)
        return l

    def configure_optimizers(self):
        raise NotImplementedError

You may notice that Lab2Module is a subclass of nn.Module, the base class of neural networks in PyTorch. It provides convenient features for handling neural networks. For example, if we define a forward method, such as forward(self, X), then for an instance a we can invoke this function by a(X). This works because nn.Module's built-in __call__ method calls forward.
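
To see this dispatch in action, here is a tiny standalone check (the toy nn.Linear model below is only for illustration):

import torch
from torch import nn

tiny = nn.Sequential(nn.Linear(2, 1))
x = torch.randn(4, 2)
# calling the instance goes through nn.Module.__call__, which invokes forward()
print(torch.equal(tiny(x), tiny.forward(x)))   # prints True: the two calls give the same result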

Section 1.3: Data base class¶

The DataModule class (Lab2Data below) is the base class for data. Quite frequently the __init__ method is used to prepare the data. This includes downloading and preprocessing if needed. The train_dataloader returns the data loader for the training dataset. A data loader is a (Python) generator that yields a data batch each time it is used. This batch is then fed into the training_step method of Module to compute the loss.

In [ ]:
class Lab2Data(d2l.HyperParameters):
    
    def __init__(self, root='./data', num_workers=4):
        self.save_hyperparameters()

    def get_dataloader(self, train):
        raise NotImplementedError

    def train_dataloader(self):
        return self.get_dataloader(train=True)
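
As a standalone illustration (the toy tensors below are made up), each iteration of a data loader yields one batch of (inputs, labels):

import torch

X = torch.arange(10, dtype=torch.float32).reshape(-1, 1)  # 10 toy inputs
Y = 2 * X                                                  # 10 toy labels
dataset = torch.utils.data.TensorDataset(X, Y)
loader = torch.utils.data.DataLoader(dataset, batch_size=4, shuffle=True)
for xb, yb in loader:
    # one batch per iteration; the last batch may be smaller than batch_size
    print(xb.shape, yb.shape)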

Section 1.4: Training base class¶

The Trainer class (Lab2Trainer below) trains the learnable parameters in the Module class with data specified in DataModule. The key method is fit, which accepts two arguments: model, an instance of Module, and data, an instance of DataModule. It then iterates over the entire dataset max_epochs times to train the model.

In [ ]:
class Lab2Trainer(d2l.HyperParameters):
    
    def __init__(self, max_epochs, num_gpus=0, gradient_clip_val=0):
        self.save_hyperparameters()
        assert num_gpus == 0, 'No GPU support yet'

    def prepare_data(self, data):
        self.train_dataloader = data.train_dataloader()
        self.num_train_batches = len(self.train_dataloader)

    def prepare_model(self, model):
        model.trainer = self
        model.board.xlim = [0, self.max_epochs]
        self.model = model

    def fit(self, model, data):
        self.prepare_data(data)
        self.prepare_model(model)
        self.optim = model.configure_optimizers()
        self.epoch = 0
        self.train_batch_idx = 0
        self.val_batch_idx = 0
        for self.epoch in range(self.max_epochs):
            self.fit_epoch()

    def fit_epoch(self):
        raise NotImplementedError

Get yourself reasonably comfortable with how Module, Data, and Trainer interact with each other, because you will soon need to fill in the methods that currently raise NotImplementedError.

Section 2: a toy example, AI fighter jet¶

Watch the "AI fighter jet" problem in the video: either see it here or play ~/lab2/FighterJet.mp4.

To summarize, we want to train a fighter-jet NN that follows a safety rule:
the fighter jet fires iff the number of missiles on-the-fly is greater than zero.
In particular, when no missiles are on the fly, the jet must not fire, no matter how many other (enemy) jets exist.
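
Stated as a plain Python predicate (a hypothetical helper, not the tensor code you will write in Exercise 1), the rule is simply:

def should_fire(num_jets, num_missiles):
    # the decision depends only on the missiles on the fly, not on the number of jets
    return num_missiles > 0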

Exercise 1: implement FighterJetData¶

You will implement a dataset (fill in __init__) for the fighter jet, and use it for training.

  • self.X will store the NN inputs (see below). It is a tensor whose rows are pairs of [#jets, #missiles].
  • self.Y will store the outputs, one firing score per input row: 0 means do-not-fire, 1 means fire.
  • You need to write code to produce self.Y in __init__ according to our safety rule.
In [ ]:
class FighterJetData(Lab2Data):
    
    def __init__(self, num_train=1000, batch_size=32):
        super().__init__()
        self.save_hyperparameters()

        # prepare training inputs
        n = num_train           # total number of instances
        jets = torch.randint(0, 20, (n,)).float()  # get a random #jets from [0,20)
        missiles = torch.randint(0, 3, (n,)).float()  # get a random #missiles from [0,3)
        self.X = torch.stack((jets, missiles), -1) # stack tensors to [[#jets, #missiles], ...]
        
        # TODO: your code here
        self.Y = None
    
    def get_dataloader(self, train):
        assert train, "We only use this dataset for training."
        dataset = torch.utils.data.TensorDataset(self.X, self.Y)
        return torch.utils.data.DataLoader(dataset, self.batch_size, shuffle=train)
In [ ]:
info("""
you should see something like:
    x= tensor([[13.,  1.]]) y= tensor([[1.]])
    x= tensor([[14.,  0.]]) y= tensor([[0.]])
    x= tensor([[1., 2.]]) y= tensor([[1.]])
    x= tensor([[6., 0.]]) y= tensor([[0.]])
    x= tensor([[5., 2.]]) y= tensor([[1.]])
    x= tensor([[4., 1.]]) y= tensor([[1.]])
    x= tensor([[15.,  0.]]) y= tensor([[0.]])
    x= tensor([[12.,  0.]]) y= tensor([[0.]])
    x= tensor([[8., 2.]]) y= tensor([[1.]])
    x= tensor([[18.,  1.]]) y= tensor([[1.]])

Check if the output value follows our safety rule:
  x[1]>0 => y=1  and  x[1]=0 => y=0
If not, you need to fix it.
""")

a = FighterJetData(10,1)
for x,y in a.train_dataloader():
    print("x=",x, "y=",y)

Exercise 2: implement FighterJetModule¶

Next, you will implement a NN to learn from the training data.

  • A simple implementation choice is a multilayer perceptron (MLP), i.e., a fully connected feed-forward network.
  • Read d2l S5.2.2.1 to see how to define one in PyTorch; a generic sketch follows this list.
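
In the spirit of d2l S5.2.2.1, a generic MLP in PyTorch is an nn.Sequential of Linear layers alternating with non-linearities; the layer sizes below are arbitrary placeholders, not the ones you should use:

from torch import nn

# a generic MLP sketch: affine (Linear) layers alternating with ReLU activations
mlp = nn.Sequential(nn.Linear(8, 32), nn.ReLU(), nn.Linear(32, 1))
print(mlp)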
In [ ]:
class FighterJetModule(Lab2Module):
    def __init__(self, plot_train_per_epoch=2, plot_valid_per_epoch=1):
        super().__init__()
        self.save_hyperparameters()
        self.board = d2l.ProgressBoard()
        
        # TODO: your code here
        self.net = None
In [ ]:
info("""
you should see something like: 
    Sequential(
      (0): Linear(in_features=2, out_features=16, bias=True)
      (1): ReLU()
      (2): Linear(in_features=16, out_features=16, bias=True)
      (3): ReLU()
      (4): Linear(in_features=16, out_features=1, bias=True)
    )
""")

m = FighterJetModule()
print(m.net)

Exercise 3: implement loss and configure_optimizers of FighterJetModule¶

Next we need to implement the loss function and add an optimizer to the module.

  • a classic loss function is $(y-\hat{y})^2$ ($y$ is the true label, $\hat{y}$ is the NN output), but you can use whatever loss function you want.
  • for optimizers, you may want to choose one from PyTorch. Read torch.optim. You can start with torch.optim.Adam or torch.optim.SGD; a standalone sketch of creating and using an optimizer follows this list.
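
As a standalone illustration (using a throwaway toy model, not FighterJetModule), creating an optimizer from torch.optim and taking one gradient step looks roughly like this:

import torch
from torch import nn

toy = nn.Linear(2, 1)                                # a throwaway toy model
optim = torch.optim.SGD(toy.parameters(), lr=0.01)   # or torch.optim.Adam(...)

y_hat = toy(torch.randn(4, 2))                       # predictions
y = torch.randn(4, 1)                                # (fake) true labels
loss = ((y - y_hat) ** 2).mean()                     # mean squared error

optim.zero_grad()    # clear old gradients
loss.backward()      # compute new gradients
optim.step()         # update the parameters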
In [ ]:
@add_to_class(FighterJetModule)
def loss(self, y_hat, y):
    # `y` is the true label
    # `y_hat` is the predicted label from the current NN
    
    # TODO: your code here
    return None

@add_to_class(FighterJetModule)
def configure_optimizers(self):
    # you should return an optimizer from `torch.optim`.
    # TODO: your code here
    return None

Until now, you've implemented the training dataset (Exercise 1), the NN architecture (Exercise 2), and the loss function and an optimizer (Exercise 3). Next is an implementation of one round (epoch) of training. Read it line by line to make sure you understand it.

Here are some pointers:

  • Line A: torch.nn.Module.train
  • Line B: torch.optim.optimizer.zero_grad
  • Line C: torch.no_grad
  • Line D: torch.optim.optimizer.step
In [ ]:
@add_to_class(Lab2Trainer)
def fit_epoch(self):
    self.model.train()          # Line A
    for batch in self.train_dataloader:
        loss = self.model.training_step(batch)
        self.optim.zero_grad()  # Line B
        with torch.no_grad():   # Line C
            loss.backward()
            self.optim.step()   # Line D
        self.train_batch_idx += 1
In [ ]:
# Training
model = FighterJetModule()           # create a model
data = FighterJetData()              # create dataset
trainer = Lab2Trainer(max_epochs=20) # create trainer, train 20 epochs

# Train! 
# you will see the loss changes while training (lower loss is better)
trainer.fit(model, data)
In [ ]:
# check if the NN learned the safety rule
info("given an input Tensor(10000,0) [#jets, #missiles], should we fire?\n \
     (by safety rule in the video, no), but...")

with torch.no_grad():
    ret = model.forward(torch.Tensor([1345,0]))
    print("fire?", ret > 0.5)
In [ ]:
%run utils.ipynb

p_points = 0
n_points = 0
with torch.no_grad():
    for p,n in zip(get_positive_tests(), get_negative_tests()):
        if model.forward(p).item() >= 0.5:
            p_points += 1
        if model.forward(n).item() < 0.5:
            n_points += 1

info(f"=== points ===\n"
     f"  positive: [{p_points}/{get_num_positive_cases()}]\n"
     f"  negative: [{n_points}/{get_num_negative_cases()}]\n"
     f"  total:    [{p_points+n_points}/{get_num_positive_cases() + get_num_negative_cases()}]")

Challenge I: safe AI fighter jet¶

Try to train a NN that produces

=== points ===
  positive: [500/500]
  negative: [500/500]
  total:    [1000/1000]

Hint: this is supposed to be a non-trivial job (but sometimes people get lucky). If you're struggling, you might want to re-implement the NN (what NNs have larger learning capacity?), and also modify the training dataset (what data will let your NN learn the safety rule?).

Section 3: Learned index¶

In this section, we're trying to replicate "S2.3 A First, Naive Learned Index" in the learned index paper, where we use one neural network to learn a sorted dataset.
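
Recall the idea from the paper: the NN maps a key to an approximate position, and a bounded local search around that prediction finds the exact record. A minimal sketch of a lookup (hypothetical names; it assumes the model takes a 1-element float tensor and that an integer error bound is known) could look like this:

import torch

def lookup(model, sorted_keys, key, err_bound):
    # 1) predict an approximate position from the key
    with torch.no_grad():
        pos = int(round(model(torch.tensor([key], dtype=torch.float32)).item()))
    # 2) search only within [pos - err_bound, pos + err_bound]
    err = int(err_bound)
    lo = max(0, pos - err)
    hi = min(len(sorted_keys) - 1, pos + err)
    for i in range(lo, hi + 1):   # a binary search over this range would also work
        if sorted_keys[i] == key:
            return i
    return None                   # key not found within the error bound
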

In [ ]:
# below are some global variables (hyperparameters)
# they are here for an easier hyperparameter tuning
# (you will need to come back and change them)
m_learning_rate = 0.01
m_batch_size = 128
m_max_epochs = 40
m_normalize = True

A glance at the datasets¶

Below we provide three datasets (named easy, medium, and hard) and their visualizations. All of these datasets are sorted data (see also SOSD). easy and medium are synthetic data; hard is generated from Wikipedia.

In [ ]:
%run utils.ipynb
import matplotlib.pyplot as plt

# (1) study datasets
datasets = {
    "easy" : get_linear_dataset(batch_size=m_batch_size, normalize=m_normalize),
    "medium" : get_lognormal_dataset(batch_size=m_batch_size, normalize=m_normalize),
    "hard" : get_wiki_dataset(batch_size=m_batch_size, normalize=m_normalize)
}

# visualize the distribution of three cases
def plot_distribution(name):
    xs = []
    ys = []
    for x,y in datasets[name].dataset:
        xs.append(x.item())
        ys.append(y.item())
    plt.plot(xs, ys)
    plt.xlabel("database key")
    plt.ylabel("data position")
    plt.title(f"dataset [{name}]")
    plt.show()

for name in datasets:
    plot_distribution(name)

Exercise 4: implement a monolithic NN for learned index¶

Of course, a simple starting point is an MLP. You can implement whatever NNs you want and compare their performance.

In [ ]:
# (2) define your model (NN)
class LearnedIndex(d2l.Module):
    
    def __init__(self):
        super().__init__()
        self.save_hyperparameters()
        
        # TODO: your code here
        self.net = None
        
    def loss(self, y_hat, y):
        # TODO: your code here
        return None
        
    def configure_optimizers(self):
        # TODO: your code here; remember to use the global var `m_learning_rate`
        # (for simpler parameter tuning)
        return None
In [ ]:
# TODO: choose the dataset to learn
my_dataset = datasets["easy"]
In [ ]:
# prepare training
model = LearnedIndex()      # create a model
data = my_dataset           # create dataset
trainer = d2l.Trainer(max_epochs=m_max_epochs) # create trainer

# Train!
trainer.fit(model, data)

Below is a test of how well your learned index performs. The higher the "index points", the better.

In [ ]:
# see how well our learned index is
%run utils.ipynb

ind_points = 0
with torch.no_grad():
    # assert "index_err_bound" in globals(), "run %run utils.ipynb"
    for x,y in my_dataset.dataset:
        if abs(model.forward(x).item() - y.item() ) <= my_dataset.get_err_bound():
            ind_points += 1
        

info(f"=== index points ===\n"
     f" [{ind_points}/{len(my_dataset.dataset)}]\n")

Challenge II: improve your learned index performance¶

Can you achieve the following learned index performance?

# for easy dataset
=== index points ===
 [9000/10000]

# for medium dataset
=== index points ===
 [8000/10000]

# for hard dataset
=== index points ===
 [7000/10000]

Hints: try to tune parameters and hyperparameters (go back to the code block with global parameters), including:

  1. NN parameters
  2. epochs (or when to stop training?)
  3. optimizer and its parameters
  4. batch sizes
  5. normalizing data
  6. what else? (Google "neural network hyperparameters" to find more)

Section 4: RMI¶

Challenge III: implement RMI¶

Implement RMI in the learned index paper, and train your RMIs to achieve

# for easy dataset
=== index points ===
 [10000/10000]

# for medium dataset
=== index points ===
 [10000/10000]

# for hard dataset
=== index points ===
 [10000/10000]
In [ ]:
# write whatever code you need to build RMI here
In [ ]: