import torch


# Example: building a two-dimensional (4x3) integer tensor
x = torch.tensor([
    [1, 2, 3],
    [4, 5, 6],
    [7, 8, 9],
    [10, 11, 12],
])
print(x.shape)


# Example: building a 4x3 float tensor with autograd tracking enabled
x = torch.tensor(
    [
        [1., 2., 3.],
        [4., 5., 6.],
        [7., 8., 9.],
        [10., 11., 12.],
    ],
    requires_grad=True,
)
print(x)


# Example: autograd on scalars (only x tracks gradients)

# Scalar tensors: w and b are constants, x is the variable we differentiate by
w = torch.tensor(2.)
b = torch.tensor(3.)
x = torch.tensor(1., requires_grad=True)

print(x.grad)  # None: no backward pass has run yet

# Forward pass: builds the computation graph for y = 2*x + 3
z = w * x
y = z + b

# Backward pass, seeded with an upstream gradient of 1
y.backward(torch.tensor(1.))

# Gradient of y with respect to x
print(x.grad)  # x.grad = 2


# Example: autograd on scalars (x, w and b all track gradients)

# Scalar tensors, each with gradient tracking enabled
x = torch.tensor(4., requires_grad=True)
w = torch.tensor(2., requires_grad=True)
b = torch.tensor(3., requires_grad=True)

# No backward pass has run yet, so every gradient is still unset
print(x.grad)  # None
print(w.grad)  # None
print(b.grad)  # None

# Forward pass: builds the computation graph for y = w*x + b
z = w * x
y = z + b

# Backward pass, seeded with an upstream gradient of 1
y.backward(torch.tensor(1.))

# Gradients of y with respect to each leaf tensor
print(x.grad)  # x.grad = 2. (the value of w)
print(w.grad)  # w.grad = 4. (the value of x)
print(b.grad)  # b.grad = 1.


# Example: autograd on 2D tensors

# Leaf tensors, all with gradient tracking enabled
X = torch.tensor(
    [
        [1., 2., 3.],
        [4., 5., 6.],
        [7., 8., 9.],
        [10., 11., 12.],
    ],
    requires_grad=True,
)  # 4x3 matrix
W = torch.tensor(
    [
        [1., 2.],
        [4., 5.],
        [7., 8.],
    ],
    requires_grad=True,
)  # 3x2 matrix
b = torch.tensor([4., 5.], requires_grad=True)  # vector of size 2


# Forward pass: affine map followed by a sum, so y is a scalar
z1 = X @ W
z2 = z1 + b
y = z2.sum()

# Backward pass, seeded with an upstream gradient of 1
y.backward(torch.tensor(1.))

# Gradients of y with respect to each leaf tensor
print(X.grad)
print(W.grad)
print(b.grad)


# CASE 1: backpropagate from the scalar y

# Leaf tensors
X = torch.tensor(
    [
        [1., 2., 3.],
        [4., 5., 6.],
        [7., 8., 9.],
        [10., 11., 12.],
    ],
    requires_grad=True,
)  # 4x3 matrix
W = torch.tensor(
    [
        [1., 2.],
        [4., 5.],
        [7., 8.],
    ],
    requires_grad=True,
)  # 3x2 matrix

# Forward pass: builds the computation graph
Z = X @ W
y = Z.sum()

y.backward(torch.tensor(1.))

print(X.grad)
# CASE 2: backpropagate from the matrix Z with a hand-written upstream gradient

# Leaf tensors (recreated so that gradients start from scratch)
X = torch.tensor(
    [
        [1., 2., 3.],
        [4., 5., 6.],
        [7., 8., 9.],
        [10., 11., 12.],
    ],
    requires_grad=True,
)  # 4x3 matrix
W = torch.tensor(
    [
        [1., 2.],
        [4., 5.],
        [7., 8.],
    ],
    requires_grad=True,
)  # 3x2 matrix

# Forward pass: builds the computation graph
Z = X @ W
y = Z.sum()

# The derivative of sum() with respect to every entry of Z is 1
dy_dZ = torch.ones(Z.shape)
Z.backward(dy_dZ)

print(X.grad)


import matplotlib.pyplot as plt
import torch


torch.random.manual_seed(0)
#%% DEFINE AND PLOT DATA


def make_meshgrid(x, y, h=.02):
    """Build a 2D grid of points covering the range of two coordinate tensors.

    Parameters
    ----------
    x: tensor whose min/max define the extent of the first grid axis
    y: tensor whose min/max define the extent of the second grid axis
    h: step between consecutive grid points, optional

    Returns
    -------
    xx, yy: coordinate tensors produced by torch.meshgrid; each axis spans the
        data range padded by 1 on both sides, and the first axis (x) varies
        along dimension 0.
    """
    x_min, x_max = x.min() - 1, x.max() + 1
    y_min, y_max = y.min() - 1, y.max() + 1
    # Pass indexing explicitly: 'ij' is the layout this code relied on
    # implicitly, and omitting the argument triggers a warning on recent
    # PyTorch releases (the keyword requires PyTorch >= 1.10).
    xx, yy = torch.meshgrid(
        torch.arange(x_min, x_max, h),
        torch.arange(y_min, y_max, h),
        indexing='ij',
    )
    return xx, yy


# One matplotlib format string (marker + colour) per class
style_per_class = ['xb', 'or', 'sg']
# Five 2D samples: the literal is 2x5 (one row per coordinate), transposed to 5x2
X = torch.tensor([
    [1.2, 2.3, -0.7, 3.2, -1.3],
    [-3.4, 2.8, 1.2, -0.4, -2.3],
]).T
# Class label of each sample
y = torch.tensor([0, 0, 1, 1, 2])


C = len(style_per_class)  # number of classes
N = X.shape[0]  # number of samples
# Grid of points covering the data, reused for the decision-region plots
xx, yy = make_meshgrid(X[:, 0].ravel(), X[:, 1].ravel(), h=0.1)


plt.figure(1)
ax = plt.subplot(111)
ax.set_xlim(xx.min(), xx.max())
ax.set_ylim(yy.min(), yy.max())
plt.grid(True)

# Draw the samples class by class, each class with its own marker style
for i in range(C):
    x_c = X[y == i]
    plt.plot(x_c[:, 0], x_c[:, 1], style_per_class[i])

plt.pause(0.1)
   
class MLP:
    """Two-layer perceptron (affine -> ReLU -> affine) trained with momentum SGD.

    The parameters are plain tensors with ``requires_grad`` enabled; their
    gradients must be populated by a backward pass before ``update`` is called.
    """

    def __init__(self, H, beta, lr, D=2, C=3):
        """Create the parameters and their zero-initialised momentum buffers.

        Parameters
        ----------
        H: number of hidden units
        beta: momentum coefficient used by ``update``
        lr: learning rate used by ``update``
        D: input dimension (defaults to 2, the previously hard-coded value)
        C: number of outputs/classes (defaults to 3, the previously
            hard-coded value)
        """
        self.C = C
        self.D = D
        self.H = H

        self.beta = beta
        self.lr = lr

        # parameters
        # NOTE(review): 2*rand - 0.5 is uniform on [-0.5, 1.5), i.e. not centred
        # on zero; 2*(rand - 0.5) may have been intended -- confirm before
        # changing, since it alters the seeded results.
        self.W1 = ((2./self.D)*(2*(torch.rand(size=(self.D,self.H)))-0.5)).requires_grad_()
        self.b1 = ((1./torch.sqrt(torch.tensor(self.D)))*(2*(torch.rand(size=(1,self.H)))-0.5)).requires_grad_()
        self.W3 = ((2./self.H)*(2*(torch.rand(size=(self.H,self.C)))-0.5)).requires_grad_()
        self.b3 = ((1./torch.sqrt(torch.tensor(self.H)))*(2*(torch.rand(size=(1,self.C)))-0.5)).requires_grad_()

        # momentum buffers, each shaped exactly like the parameter it tracks
        self.VW1 = torch.zeros((self.D, self.H))
        self.Vb1 = torch.zeros((1, self.H))
        self.VW3 = torch.zeros((self.H, self.C))
        self.Vb3 = torch.zeros((1, self.C))

    def forward(self, X):
        """Return the N x C output scores for an N x D input batch ``X``."""
        X1 = X.matmul(self.W1) + self.b1  # NxH
        X2 = torch.maximum(torch.tensor(0.), X1)  # NxH, ReLU
        O = X2.matmul(self.W3) + self.b3  # NxC

        return O

    def update(self):
        """Apply one momentum-SGD step to every parameter.

        For each parameter p with buffer V: V <- beta*V + (1-beta)*p.grad,
        then p <- p - lr*V. Every ``.grad`` must already be populated.
        """
        # The parameter updates themselves must not be recorded by autograd.
        with torch.no_grad():
            self.VW1 = self._momentum_step(self.W1, self.VW1)
            self.VW3 = self._momentum_step(self.W3, self.VW3)
            self.Vb1 = self._momentum_step(self.b1, self.Vb1)
            self.Vb3 = self._momentum_step(self.b3, self.Vb3)

    def _momentum_step(self, param, velocity):
        """Update ``param`` in place and return its refreshed momentum buffer.

        Must be called with gradient tracking disabled (see ``update``).
        """
        velocity = self.beta*velocity + (1.0-self.beta)*param.grad
        param -= self.lr*velocity
        return velocity

    def zero_gradients(self):
        """Discard the stored gradients so the next backward pass starts fresh."""
        self.W1.grad = None
        self.b1.grad = None
        self.W3.grad = None
        self.b3.grad = None
    
  
def logsoftmax(x):
    """Log-softmax along dimension 1.

    The per-row maximum is subtracted before exponentiating so that large
    inputs do not overflow.
    """
    row_max = x.amax(dim=1, keepdim=True)
    shifted = x - row_max
    log_norm = shifted.exp().sum(dim=1, keepdim=True).log()
    return shifted - log_norm
    
def softmax(x):
    """Softmax along dimension 1.

    The per-row maximum is subtracted before exponentiating so that large
    inputs do not overflow.
    """
    row_max = x.amax(dim=1, keepdim=True)
    exps = (x - row_max).exp()
    return exps / exps.sum(dim=1, keepdim=True)
    
def multinoulliCrossEntropyLoss(O, y):
    """Mean cross-entropy loss and its gradient with respect to the scores.

    Parameters
    ----------
    O: score tensor, indexed as [sample, class]
    y: integer class index of each sample

    Returns
    -------
    (l, dl_do): the mean negative log-probability of the labelled classes, and
        the gradient of that mean with respect to O, i.e. (softmax(O) - onehot(y)) / N.
        Both are computed with gradient tracking disabled.
    """
    with torch.no_grad():
        n_samples = y.shape[0]
        rows = torch.arange(n_samples)
        scores = O.type(torch.float32)

        # Loss: average of -log p(label) over the samples
        picked = logsoftmax(scores)[rows, y]
        loss = -picked.sum() / n_samples

        # Gradient: probabilities minus one at the labelled class, then averaged
        grad = softmax(scores)
        grad[rows, y] -= 1
        grad = grad / n_samples
    return (loss, grad)
        

def plot_contours(ax, model, xx, yy, **params):
    """Plot the decision regions of a classifier as filled contours.

    Parameters
    ----------
    ax: matplotlib axes object
    model: classifier exposing ``forward``; it is called on a tensor with one
        row per grid point (columns: xx value, yy value) and its output is
        arg-maxed along dimension 1 to obtain the predicted class
    xx: meshgrid tensor holding the first coordinate of each grid point
    yy: meshgrid tensor holding the second coordinate of each grid point
    params: dictionary of params to pass to contourf, optional

    Returns
    -------
    The value returned by ``ax.contourf``.
    """
    # One row per grid point: column 0 from xx, column 1 from yy.
    grid = torch.hstack((xx.reshape(-1, 1), yy.reshape(-1, 1)))
    # Inference only: do not build an autograd graph for the whole grid.
    with torch.no_grad():
        O = model.forward(grid)
    pred = torch.argmax(O, dim=1)
    Z = pred.reshape(xx.shape)
    out = ax.contourf(xx, yy, Z, **params)

    return out

#%% HYPERPARAMETERS
H = 30
lr = 1e-2  # learning rate
beta = 0.9  # momentum parameter
n_epoch = 10000  # number of iterations

model = MLP(H, beta, lr)


for i in range(n_epoch):

    # Forward pass
    O = model.forward(X)

    # Loss value and its gradient with respect to the scores O
    [l, dl_dO] = multinoulliCrossEntropyLoss(O, y)

    # Print loss and classification accuracy
    pred = torch.argmax(O, axis=1)
    acc = (pred == y).type(torch.float32).sum()/N
    print('Iter {} | Loss = {} | Training Accuracy = {}%'.format(i,l,acc*100))

    # Backward pass: clear stale gradients, then backpropagate dl/dO through O
    model.zero_gradients()
    O.backward(dl_dO)

    # Update parameters
    model.update()

    if (i % 10) == 0:
        # Plot decision boundary
        ax.cla()
        # A distinct index name keeps the epoch counter `i` intact.
        for c in range(C):
            x_c = X[(y == c).ravel(), :]
            plt.plot(x_c[:, 0], x_c[:, 1], style_per_class[c])
        plot_contours(ax, model, xx, yy, cmap=plt.cm.coolwarm, alpha=0.8)
        plt.pause(0.5)


import torch.nn as nn
import torch

# Fully connected (affine) layer mapping 3 input features to 2 outputs
linear = nn.Linear(3, 2)
print('w: ', linear.weight)
print('b: ', linear.bias)

# Apply the layer to a batch of 10 random samples with 3 features each
x = torch.randn((10, 3))
pred = linear(x)


class MLP(nn.Module):
    """Two-layer perceptron (Linear -> ReLU -> Linear) with a hand-written
    momentum-SGD update.

    Gradients must be populated by a backward pass before ``update`` is called.
    """

    def __init__(self, H, beta, lr, D=2, C=3):
        """Create the layers and their zero-initialised momentum buffers.

        Parameters
        ----------
        H: number of hidden units
        beta: momentum coefficient used by ``update``
        lr: learning rate used by ``update``
        D: input dimension (defaults to 2, the previously hard-coded value)
        C: number of outputs/classes (defaults to 3, the previously
            hard-coded value)
        """
        super().__init__()

        self.C = C
        self.D = D
        self.H = H

        self.beta = beta
        self.lr = lr

        self.fc1 = nn.Linear(self.D, self.H)
        self.relu = nn.ReLU()
        self.fc2 = nn.Linear(self.H, self.C)

        # momentum buffers, shaped like the parameter each one tracks
        # (nn.Linear stores its weight as out_features x in_features)
        self.VW1 = torch.zeros((self.H, self.D))
        self.Vb1 = torch.zeros((self.H))
        self.VW3 = torch.zeros((self.C, self.H))
        self.Vb3 = torch.zeros((self.C))

    def forward(self, X):
        """Return the N x C output scores for an N x D input batch ``X``."""
        X1 = self.fc1(X)  # NxH
        X2 = self.relu(X1)  # NxH
        O = self.fc2(X2)  # NxC

        return O

    def update(self):
        """Apply one momentum-SGD step to every parameter.

        For each parameter p with buffer V: V <- beta*V + (1-beta)*p.grad,
        then p <- p - lr*V. Every ``.grad`` must already be populated.
        """
        # The parameter updates themselves must not be recorded by autograd.
        with torch.no_grad():
            self.VW1 = self._momentum_step(self.fc1.weight, self.VW1)
            self.VW3 = self._momentum_step(self.fc2.weight, self.VW3)
            self.Vb1 = self._momentum_step(self.fc1.bias, self.Vb1)
            self.Vb3 = self._momentum_step(self.fc2.bias, self.Vb3)

    def _momentum_step(self, param, velocity):
        """Update ``param`` in place and return its refreshed momentum buffer.

        Must be called with gradient tracking disabled (see ``update``).
        """
        velocity = self.beta*velocity + (1.0-self.beta)*param.grad
        param -= self.lr*velocity
        return velocity

    def zero_gradients(self):
        """Discard the stored gradients so the next backward pass starts fresh."""
        self.fc1.weight.grad = None
        self.fc1.bias.grad = None
        self.fc2.weight.grad = None
        self.fc2.bias.grad = None


import matplotlib.pyplot as plt
import torch
import torch.nn as nn

torch.random.manual_seed(0)
#%% DEFINE AND PLOT DATA


def make_meshgrid(x, y, h=.02):
    """Build a 2D grid of points covering the range of two coordinate tensors.

    Parameters
    ----------
    x: tensor whose min/max define the extent of the first grid axis
    y: tensor whose min/max define the extent of the second grid axis
    h: step between consecutive grid points, optional

    Returns
    -------
    xx, yy: coordinate tensors produced by torch.meshgrid; each axis spans the
        data range padded by 1 on both sides, and the first axis (x) varies
        along dimension 0.
    """
    x_min, x_max = x.min() - 1, x.max() + 1
    y_min, y_max = y.min() - 1, y.max() + 1
    # Pass indexing explicitly: 'ij' is the layout this code relied on
    # implicitly, and omitting the argument triggers a warning on recent
    # PyTorch releases (the keyword requires PyTorch >= 1.10).
    xx, yy = torch.meshgrid(
        torch.arange(x_min, x_max, h),
        torch.arange(y_min, y_max, h),
        indexing='ij',
    )
    return xx, yy


# One matplotlib format string (marker + colour) per class
style_per_class = ['xb', 'or', 'sg']
# Five 2D samples: the literal is 2x5 (one row per coordinate), transposed to 5x2
X = torch.tensor([
    [1.2, 2.3, -0.7, 3.2, -1.3],
    [-3.4, 2.8, 1.2, -0.4, -2.3],
]).T
# Class label of each sample
y = torch.tensor([0, 0, 1, 1, 2])


C = len(style_per_class)  # number of classes
N = X.shape[0]  # number of samples
# Grid of points covering the data, reused for the decision-region plots
xx, yy = make_meshgrid(X[:, 0].ravel(), X[:, 1].ravel(), h=0.1)


plt.figure(1)
ax = plt.subplot(111)
ax.set_xlim(xx.min(), xx.max())
ax.set_ylim(yy.min(), yy.max())
plt.grid(True)

# Draw the samples class by class, each class with its own marker style
for i in range(C):
    x_c = X[y == i]
    plt.plot(x_c[:, 0], x_c[:, 1], style_per_class[i])

plt.pause(0.1)
   

class MLP(nn.Module):
    """Two-layer perceptron (Linear -> ReLU -> Linear) with a hand-written
    momentum-SGD update.

    Gradients must be populated by a backward pass before ``update`` is called.
    """

    def __init__(self, H, beta, lr, D=2, C=3):
        """Create the layers and their zero-initialised momentum buffers.

        Parameters
        ----------
        H: number of hidden units
        beta: momentum coefficient used by ``update``
        lr: learning rate used by ``update``
        D: input dimension (defaults to 2, the previously hard-coded value)
        C: number of outputs/classes (defaults to 3, the previously
            hard-coded value)
        """
        super().__init__()

        self.C = C
        self.D = D
        self.H = H

        self.beta = beta
        self.lr = lr

        self.fc1 = nn.Linear(self.D, self.H)
        self.relu = nn.ReLU()
        self.fc2 = nn.Linear(self.H, self.C)

        # momentum buffers, shaped like the parameter each one tracks
        # (nn.Linear stores its weight as out_features x in_features)
        self.VW1 = torch.zeros((self.H, self.D))
        self.Vb1 = torch.zeros((self.H))
        self.VW3 = torch.zeros((self.C, self.H))
        self.Vb3 = torch.zeros((self.C))

    def forward(self, X):
        """Return the N x C output scores for an N x D input batch ``X``."""
        X1 = self.fc1(X)  # NxH
        X2 = self.relu(X1)  # NxH
        O = self.fc2(X2)  # NxC

        return O

    def update(self):
        """Apply one momentum-SGD step to every parameter.

        For each parameter p with buffer V: V <- beta*V + (1-beta)*p.grad,
        then p <- p - lr*V. Every ``.grad`` must already be populated.
        """
        # The parameter updates themselves must not be recorded by autograd.
        with torch.no_grad():
            self.VW1 = self._momentum_step(self.fc1.weight, self.VW1)
            self.VW3 = self._momentum_step(self.fc2.weight, self.VW3)
            self.Vb1 = self._momentum_step(self.fc1.bias, self.Vb1)
            self.Vb3 = self._momentum_step(self.fc2.bias, self.Vb3)

    def _momentum_step(self, param, velocity):
        """Update ``param`` in place and return its refreshed momentum buffer.

        Must be called with gradient tracking disabled (see ``update``).
        """
        velocity = self.beta*velocity + (1.0-self.beta)*param.grad
        param -= self.lr*velocity
        return velocity

    def zero_gradients(self):
        """Discard the stored gradients so the next backward pass starts fresh."""
        self.fc1.weight.grad = None
        self.fc1.bias.grad = None
        self.fc2.weight.grad = None
        self.fc2.bias.grad = None
    

def plot_contours(ax, model, xx, yy, **params):
    """Plot the decision regions of a classifier as filled contours.

    Parameters
    ----------
    ax: matplotlib axes object
    model: classifier exposing ``forward``; it is called on a tensor with one
        row per grid point (columns: xx value, yy value) and its output is
        arg-maxed along dimension 1 to obtain the predicted class
    xx: meshgrid tensor holding the first coordinate of each grid point
    yy: meshgrid tensor holding the second coordinate of each grid point
    params: dictionary of params to pass to contourf, optional

    Returns
    -------
    The value returned by ``ax.contourf``.
    """
    # One row per grid point: column 0 from xx, column 1 from yy.
    grid = torch.hstack((xx.reshape(-1, 1), yy.reshape(-1, 1)))
    # Inference only: do not build an autograd graph for the whole grid.
    with torch.no_grad():
        O = model.forward(grid)
    pred = torch.argmax(O, dim=1)
    Z = pred.reshape(xx.shape)
    out = ax.contourf(xx, yy, Z, **params)

    return out

#%% HYPERPARAMETERS
H = 30
lr = 1e-2  # learning rate
beta = 0.9  # momentum parameter
n_epoch = 10000  # number of iterations

model = MLP(H, beta, lr)

criterion = nn.CrossEntropyLoss()

for i in range(n_epoch):

    # Forward pass; calling the module (rather than .forward directly) goes
    # through nn.Module.__call__, so any registered hooks are honoured.
    O = model(X)

    # Compute loss
    l = criterion(O, y)

    # Print loss and classification accuracy
    pred = torch.argmax(O, axis=1)
    acc = (pred == y).type(torch.float32).sum()/N
    print('Iter {} | Loss = {} | Training Accuracy = {}%'.format(i,l,acc*100))

    # Backward pass: clear stale gradients, then let autograd compute new ones
    model.zero_gradients()
    l.backward()

    # Update parameters
    model.update()

    if (i % 10) == 0:
        # Plot decision boundary
        ax.cla()
        # A distinct index name keeps the epoch counter `i` intact.
        for c in range(C):
            x_c = X[(y == c).ravel(), :]
            plt.plot(x_c[:, 0], x_c[:, 1], style_per_class[c])
        plot_contours(ax, model, xx, yy, cmap=plt.cm.coolwarm, alpha=0.8)
        plt.pause(0.5)


import matplotlib.pyplot as plt
import torch
import torch.nn as nn

torch.random.manual_seed(0)
#%% DEFINE AND PLOT DATA


def make_meshgrid(x, y, h=.02):
    """Build a 2D grid of points covering the range of two coordinate tensors.

    Parameters
    ----------
    x: tensor whose min/max define the extent of the first grid axis
    y: tensor whose min/max define the extent of the second grid axis
    h: step between consecutive grid points, optional

    Returns
    -------
    xx, yy: coordinate tensors produced by torch.meshgrid; each axis spans the
        data range padded by 1 on both sides, and the first axis (x) varies
        along dimension 0.
    """
    x_min, x_max = x.min() - 1, x.max() + 1
    y_min, y_max = y.min() - 1, y.max() + 1
    # Pass indexing explicitly: 'ij' is the layout this code relied on
    # implicitly, and omitting the argument triggers a warning on recent
    # PyTorch releases (the keyword requires PyTorch >= 1.10).
    xx, yy = torch.meshgrid(
        torch.arange(x_min, x_max, h),
        torch.arange(y_min, y_max, h),
        indexing='ij',
    )
    return xx, yy


# One matplotlib format string (marker + colour) per class
style_per_class = ['xb', 'or', 'sg']
# Five 2D samples: the literal is 2x5 (one row per coordinate), transposed to 5x2
X = torch.tensor([
    [1.2, 2.3, -0.7, 3.2, -1.3],
    [-3.4, 2.8, 1.2, -0.4, -2.3],
]).T
# Class label of each sample
y = torch.tensor([0, 0, 1, 1, 2])


C = len(style_per_class)  # number of classes
N = X.shape[0]  # number of samples
# Grid of points covering the data, reused for the decision-region plots
xx, yy = make_meshgrid(X[:, 0].ravel(), X[:, 1].ravel(), h=0.1)


plt.figure(1)
ax = plt.subplot(111)
ax.set_xlim(xx.min(), xx.max())
ax.set_ylim(yy.min(), yy.max())
plt.grid(True)

# Draw the samples class by class, each class with its own marker style
for i in range(C):
    x_c = X[y == i]
    plt.plot(x_c[:, 0], x_c[:, 1], style_per_class[i])

plt.pause(0.1)
   
        
class MLP(nn.Module):
    """Two-layer perceptron: Linear -> ReLU -> Linear."""

    def __init__(self, H, D=2, C=3):
        """Create the layers.

        Parameters
        ----------
        H: number of hidden units
        D: input dimension (defaults to 2, the previously hard-coded value)
        C: number of outputs/classes (defaults to 3, the previously
            hard-coded value)
        """
        super().__init__()

        self.C = C
        self.D = D
        self.H = H

        self.fc1 = nn.Linear(self.D, self.H)
        self.relu = nn.ReLU()
        self.fc2 = nn.Linear(self.H, self.C)

    def forward(self, X):
        """Return the N x C output scores for an N x D input batch ``X``."""
        X1 = self.fc1(X)  # NxH
        X2 = self.relu(X1)  # NxH
        O = self.fc2(X2)  # NxC

        return O
    

def plot_contours(ax, model, xx, yy, **params):
    """Plot the decision regions of a classifier as filled contours.

    Parameters
    ----------
    ax: matplotlib axes object
    model: classifier exposing ``forward``; it is called on a tensor with one
        row per grid point (columns: xx value, yy value) and its output is
        arg-maxed along dimension 1 to obtain the predicted class
    xx: meshgrid tensor holding the first coordinate of each grid point
    yy: meshgrid tensor holding the second coordinate of each grid point
    params: dictionary of params to pass to contourf, optional

    Returns
    -------
    The value returned by ``ax.contourf``.
    """
    # One row per grid point: column 0 from xx, column 1 from yy.
    grid = torch.hstack((xx.reshape(-1, 1), yy.reshape(-1, 1)))
    # Inference only: do not build an autograd graph for the whole grid.
    with torch.no_grad():
        O = model.forward(grid)
    pred = torch.argmax(O, dim=1)
    Z = pred.reshape(xx.shape)
    out = ax.contourf(xx, yy, Z, **params)

    return out

#%% HYPERPARAMETERS
H = 30
lr = 1e-2  # learning rate
beta = 0.9  # momentum parameter
n_epoch = 10000  # number of iterations

model = MLP(H)
optimizer = torch.optim.SGD(model.parameters(), lr=lr, momentum=beta)
criterion = nn.CrossEntropyLoss()

for i in range(n_epoch):

    # Forward pass; calling the module (rather than .forward directly) goes
    # through nn.Module.__call__, so any registered hooks are honoured.
    O = model(X)

    # Compute loss
    l = criterion(O, y)

    # Print loss and classification accuracy
    pred = torch.argmax(O, axis=1)
    acc = (pred == y).type(torch.float32).sum()/N
    print('Iter {} | Loss = {} | Training Accuracy = {}%'.format(i,l,acc*100))

    # Backward pass: clear stale gradients, then let autograd compute new ones
    optimizer.zero_grad()
    l.backward()

    # Update parameters
    optimizer.step()

    if (i % 10) == 0:
        # Plot decision boundary
        ax.cla()
        # A distinct index name keeps the epoch counter `i` intact.
        for c in range(C):
            x_c = X[(y == c).ravel(), :]
            plt.plot(x_c[:, 0], x_c[:, 1], style_per_class[c])
        plot_contours(ax, model, xx, yy, cmap=plt.cm.coolwarm, alpha=0.8)
        plt.pause(0.5)

TP MLP PyTorch

Configuration

Si vous utilisez un ordinateur de l'ENSEIRB :

1) Lancer une session Linux (et non pas Windows)

2) Aller dans "Applications", puis "Autre", puis "conda_pytorch" (un terminal devrait s'ouvrir)

3) Dans ce terminal, taper la commande suivante pour lancer Spyder :

4) Configurer Spyder en suivant ces instructions : Lien configuration Spyder.

Si vous utilisez votre ordinateur personnel, il faudra installer Spyder.

I) Introduction à PyTorch

Créer un nouveau script Python et copier/coller le code suivant :

Fonctionnalité "autograd" de PyTorch

II) Du MLP en NumPy au MLP en PyTorch sans autograd

III) Utilisation de la fonctionnalité autograd

IV) Utilisation du paquet `torch.nn`

Exemple de la transformation affine générale ("Fully Connected")

V) Utilisation du paquet `torch.optim`

TP MLP PyTorch

Configuration

Si vous utilisez un ordinateur de l'ENSEIRB :

1) Lancer une session Linux (et non pas Windows)

2) Aller dans "Applications", puis "Autre", puis "conda_pytorch" (un terminal devrait s'ouvrir)

3) Dans ce terminal, taper la commande suivante pour lancer Spyder :

4) Configurer Spyder en suivant ces instructions : Lien configuration Spyder.

Si vous utilisez votre ordinateur personnel, il faudra installer Spyder.

I) Introduction à PyTorch

Créer un nouveau script Python et copier/coller le code suivant :

Fonctionnalité "autograd" de PyTorch

II) Du MLP en NumPy au MLP en PyTorch sans autograd

III) Utilisation de la fonctionnalité autograd

IV) Utilisation du paquet `torch.nn`

Exemple de la transformation affine générale ("Fully Connected")

V) Utilisation du paquet `torch.optim`

IV) Utilisation du paquet `torch.nn`

V) Utilisation du paquet `torch.optim`