from sklearn.model_selection import train_test_split
from sklearn.metrics import classification_report
from tqdm import tqdm
import matplotlib.pyplot as plt
import numpy as np

class Linear():
    """Affine (pre-activation) node computing ``w @ x + b``.

    Attributes:
        w: Weight matrix of shape ``(output_size, input_size)``.
        b: Bias vector of shape ``(output_size,)``.
        x: Input seen in the most recent forward pass (cached for backward).
        d: Gradient of the risk with respect to this node's input, filled in
            by :meth:`backward`.
    """

    def __init__(self, input_size, output_size):
        # Gaussian weights scaled by 1/sqrt(fan_in) keep the initial
        # pre-activations at roughly unit scale; biases start at zero.
        self.w = np.random.randn(output_size, input_size) / np.sqrt(input_size)
        self.b = np.zeros(output_size)
        self.x = None
        self.d = None

    def __call__(self, x):
        """Run the forward pass on a single input vector ``x``."""
        # Cache the input: the weight gradient is an outer product with it.
        self.x = np.asarray(x, dtype=float)
        return self.w @ self.x + self.b

    def backward(self, layer):
        """Back-propagate through this node.

        Args:
            layer: The node that consumed this node's output. Its ``d``
                attribute must hold the gradient of the risk with respect to
                that node's input (i.e. with respect to this node's output).

        Returns:
            Tuple ``(dw, db)`` with the gradients of the risk with respect to
            ``w`` and ``b``.
        """
        if self.x is None:
            raise RuntimeError("backward() called before a forward pass")
        upstream = np.asarray(layer.d, dtype=float)
        dw = np.outer(upstream, self.x)
        # Return a copy so callers cannot alias the upstream node's buffer.
        db = upstream.copy()
        # Gradient with respect to this node's input, for the node below.
        self.d = self.w.T @ upstream
        return dw, db

class Tanh():
    """Hyperbolic-tangent activation node.

    Attributes:
        act: The element-wise activation function (``np.tanh``).
        h: Output of the most recent forward pass (cached for backward).
        d: Gradient of the risk with respect to this node's input, filled in
            by :meth:`backward`.
    """

    def __init__(self):
        self.act = np.tanh
        self.h = None
        self.d = None

    def __call__(self, x):
        """Apply tanh element-wise to ``x`` and cache the result."""
        self.h = self.act(x)
        return self.h

    def backward(self, layer):
        """Back-propagate through the activation.

        Args:
            layer: The node that consumed this node's output. Its ``d``
                attribute must hold the gradient of the risk with respect to
                that node's input (i.e. with respect to this node's output).

        Returns:
            The gradient of the risk with respect to this node's input.
        """
        if self.h is None:
            raise RuntimeError("backward() called before a forward pass")
        # d tanh(a) / da = 1 - tanh(a)^2, applied element-wise.
        self.d = (1.0 - self.h ** 2) * np.asarray(layer.d, dtype=float)
        return self.d

class Softmax():
    """Softmax output node.

    Attributes:
        f: Probabilities produced by the most recent forward pass.
        d: Gradient of the risk with respect to this node's input, filled in
            by :meth:`backward`.
        axis: Axis that was normalised in the most recent forward pass.
    """

    def __init__(self):
        self.f = None
        self.d = None
        self.axis = 0

    def __call__(self, x, axis=0):
        """Return ``softmax(x)`` along ``axis`` and cache it for backward."""
        x = np.asarray(x, dtype=float)
        # Subtracting the maximum leaves the result unchanged but prevents
        # overflow in exp() for large scores.
        exps = np.exp(x - x.max(axis=axis, keepdims=True))
        self.f = exps / exps.sum(axis=axis, keepdims=True)
        self.axis = axis
        return self.f

    def backward(self, layer):
        """Back-propagate through the softmax.

        Args:
            layer: The node that consumed this node's output (typically the
                risk node). Its ``d`` attribute must hold the gradient of the
                risk with respect to the softmax probabilities.

        Returns:
            The gradient of the risk with respect to the softmax input.
        """
        if self.f is None:
            raise RuntimeError("backward() called before a forward pass")
        upstream = np.asarray(layer.d, dtype=float)
        # Jacobian-vector product with J = diag(f) - f f^T, computed without
        # materialising the Jacobian.
        weighted = (upstream * self.f).sum(axis=self.axis, keepdims=True)
        self.d = self.f * (upstream - weighted)
        return self.d

class CrossEntropy():
    """Risk node: cross-entropy of a predicted distribution against a class index.

    Attributes:
        y: Class index given to the most recent forward pass.
        pred: Predicted probabilities given to the most recent forward pass.
        d: Gradient of the risk with respect to ``pred``, filled in by
            :meth:`backward`.
    """

    def __init__(self):
        self.y = None
        self.pred = None
        self.d = None

    def __call__(self, y, pred):
        """Return the risk ``-log(pred[y])`` for true class index ``y``."""
        self.y = int(y)
        self.pred = np.asarray(pred, dtype=float)
        return -np.log(self.pred[self.y])

    def backward(self):
        """Compute the gradient of the risk with respect to the prediction.

        Returns:
            A vector shaped like ``pred`` that is ``-1 / pred[y]`` at the true
            class and zero elsewhere. The same array is stored in ``d``.
        """
        if self.pred is None:
            raise RuntimeError("backward() called before a forward pass")
        self.d = np.zeros_like(self.pred)
        # Only the probability of the true class appears in the risk.
        self.d[self.y] = -1.0 / self.pred[self.y]
        return self.d


"""
Creación de los datos
"""
# Two classes of 2-D points on concentric circles of radius r0 and r1,
# k points per class, perturbed with Gaussian noise.
r0, r1 = 1, 3
k = 1000
# The angles are the integers 0..k-1 interpreted as radians.
angles = np.arange(k)
unit_circle = np.column_stack((np.cos(angles), np.sin(angles)))
X1 = r0 * unit_circle
X2 = r1 * unit_circle
X = np.concatenate((X1, X2))
n, d = X.shape
# Labels: 0 for the inner ring (first k rows), 1 for the outer ring.
Y = np.zeros(2*k)
Y[k:] += 1
# One standard-normal draw per coordinate, scaled by 0.5 when added.
noise = np.random.normal(0, 1, (n, d))
X += 0.5*noise

# Split into train and test sets; test_size=0.3 holds out 30% for testing
x_train, x_test, y_train, y_test = train_test_split(X,Y, test_size=0.3)

# Visualize the training set, coloring each point by its class label
plt.scatter(x_train[:,0], x_train[:,1],c=y_train,s=1)
plt.show()


from node_layers import *

class Network():
    """Feed-forward network assembled as a computational graph.

    The graph chains four nodes: ``Linear(2, 10)`` -> ``Tanh`` ->
    ``Linear(10, 2)`` -> ``Softmax``.
    """

    def __init__(self):
        super().__init__()
        # First pre-activation node
        self.l1 = Linear(2, 10)
        # Hidden activation node
        self.g = Tanh()
        # Second pre-activation node
        self.l2 = Linear(10, 2)
        # Output node
        self.f = Softmax()

    def __call__(self, x):
        """Forward pass: feed ``x`` through the nodes in graph order."""
        out = x
        for node in (self.l1, self.g, self.l2, self.f):
            out = node(out)
        return out

    def backward(self, risk_layer):
        """Backward pass: visit the nodes in reverse graph order.

        Each node's ``backward`` receives the node that sits directly above
        it in the graph, starting from ``risk_layer`` for the output node.

        Returns:
            Tuple ``(dw1, dw2, db1, db2)`` built from the pairs returned by
            the two linear nodes.
        """
        self.f.backward(layer=risk_layer)
        # Gradients of the second linear node
        grad_w2, grad_b2 = self.l2.backward(layer=self.f)
        self.g.backward(layer=self.l2)
        # Gradients of the first linear node
        grad_w1, grad_b1 = self.l1.backward(layer=self.g)
        return grad_w1, grad_w2, grad_b1, grad_b2


# Build the network
ffn = Network()
# Smoke test: forward pass on a single training sample
ffn(x_train[0])

array([0.60349786, 0.39650214])


def gradient_descent(net, d_net, lr=1.0):
    """Apply one gradient-descent step to the two linear nodes of ``net``.

    Args:
        net: Object exposing nodes ``l1`` and ``l2``, each with ``w`` and ``b``.
        d_net: Gradients ordered as ``(dw1, dw2, db1, db2)``.
        lr: Learning rate that scales every gradient.

    The parameters are updated with ``-=``; nothing is returned.
    """
    dw1, dw2, db1, db2 = d_net
    nodes = (net.l1, net.l2)
    # Weights first, then biases.
    for node, grad in zip(nodes, (dw1, dw2)):
        node.w -= lr * grad
    for node, grad in zip(nodes, (db1, db2)):
        node.b -= lr * grad


# Risk (loss) node
risk = CrossEntropy()

# Number of epochs
epochs = 100
# Learning rate
lr = 0.001
# Accumulated risk of each epoch, used later to plot the learning curve
total_risk = []
for t in tqdm(range(epochs)):
    epoch_risk = 0
    # One parameter update per training sample
    for x_i,y_i in zip(x_train, y_train):
        # FORWARD
        y_pred = ffn(x_i)
        # Labels are stored as floats, so cast to int before passing to the risk
        risk_i = risk(int(y_i), y_pred)
        # Accumulate the risk of this sample
        epoch_risk += risk_i
        
        # BACKWARD
        # The return value is discarded; presumably the risk node keeps its
        # derivative internally for ffn.backward to read -- TODO confirm
        risk.backward()
        d_ffn = ffn.backward(risk_layer=risk)
        
        # Gradient-descent step
        gradient_descent(ffn, d_ffn, lr=lr)
        
    total_risk.append(epoch_risk)

100%|█████████████████████████████████████████| 100/100 [00:11<00:00,  8.48it/s]


# Learning curve: accumulated risk per epoch
plt.plot(total_risk)
plt.title('Pérdida a través de épocas')
plt.xlabel('Época')
plt.ylabel('Riesgo')
plt.show()


# Predictions on the evaluation set: index of the largest network output
y_pred = [ffn(x_i).argmax() for x_i in x_test]

# classification_report takes (y_true, y_pred), in that order
print(classification_report(y_test, y_pred))

              precision    recall  f1-score   support

         0.0       0.97      0.96      0.96       297
         1.0       0.96      0.97      0.96       303

    accuracy                           0.96       600
   macro avg       0.96      0.96      0.96       600
weighted avg       0.96      0.96      0.96       600


# Decision regions: classify every point of a regular grid that covers the
# test set (with a margin of 1 on each side) and draw the predicted class as
# a filled contour underneath the test points.
# Both bounds come from x_test, the data that is actually plotted.
min1, max1 = x_test[:, 0].min()-1, x_test[:, 0].max()+1
min2, max2 = x_test[:, 1].min()-1, x_test[:, 1].max()+1
x1grid = np.arange(min1, max1, 0.1)
x2grid = np.arange(min2, max2, 0.1)
xx, yy = np.meshgrid(x1grid, x2grid)
# Flatten the grid into column vectors and pair them up as (x1, x2) rows.
# NOTE: this rebinds r1, which earlier in the file holds the outer-ring radius.
r1, r2 = xx.reshape(-1, 1), yy.reshape(-1, 1)
grid = np.hstack((r1, r2))
# The network is called on one vector at a time.
yhat = np.array([ffn(x_i).argmax() for x_i in grid])
zz = yhat.reshape(xx.shape)
plt.contourf(xx, yy, zz, alpha=0.6)

plt.scatter(x_test[:,0], x_test[:,1],c=y_test,s=2)
plt.show()


import torch
import torch.nn as nn

# Same architecture as the NumPy network: Linear(2,10) -> Tanh -> Linear(10,2) -> Softmax.
# dim=-1 normalises over the class axis for both a single vector and a batch,
# and avoids the deprecated implicit-dimension behaviour of nn.Softmax().
ffn_torch = nn.Sequential(nn.Linear(2,10), nn.Tanh(), nn.Linear(10,2), nn.Softmax(dim=-1))

# Smoke test: forward pass on a single training sample
ffn_torch(torch.Tensor(x_train[0]))

/home/ia-unam/anaconda3/lib/python3.10/site-packages/torch/nn/modules/container.py:217: UserWarning: Implicit dimension choice for softmax has been deprecated. Change the call to include dim=X as an argument.
  input = module(input)

tensor([0.6595, 0.3405], grad_fn=<SoftmaxBackward0>)


# Risk node. ffn_torch already ends in a Softmax, so its output is a vector of
# probabilities. nn.CrossEntropyLoss expects raw logits and would apply
# softmax a second time; the negative log-likelihood of the log-probabilities
# is the cross-entropy that matches this model.
risk_torch = nn.NLLLoss()
optimizer = torch.optim.SGD(ffn_torch.parameters(), lr=0.001)

# Convert the training data to tensors once instead of once per sample.
x_train_t = torch.as_tensor(x_train, dtype=torch.float32)
y_train_t = torch.as_tensor(y_train, dtype=torch.long)

total_risk = []
for t in tqdm(range(epochs)):
    epoch_risk = 0.0
    for x_i, y_i in zip(x_train_t, y_train_t):
        # FORWARD
        y_pred = ffn_torch(x_i)
        # Clamp before the log so an underflowed probability cannot yield -inf.
        log_pred = torch.log(y_pred.clamp_min(torch.finfo(y_pred.dtype).tiny))
        loss = risk_torch(log_pred, y_i)
        # .item() gives a plain float, so the running total does not keep
        # every sample's autograd graph alive.
        epoch_risk += loss.item()

        # BACKWARD
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

    total_risk.append(epoch_risk)

100%|█████████████████████████████████████████| 100/100 [01:30<00:00,  1.10it/s]


# Learning curve of the PyTorch model: accumulated risk per epoch
plt.plot(total_risk)
plt.title('Pérdida a través de épocas')
plt.xlabel('Época')
plt.ylabel('Riesgo')
plt.show()


# Predicted class for every test sample; no gradients are needed at inference.
with torch.no_grad():
    y_torch = ffn_torch(torch.Tensor(x_test)).argmax(axis=1).numpy()

# classification_report takes (y_true, y_pred): the ground truth goes first,
# otherwise precision and recall are reported swapped.
print(classification_report(y_test, y_torch))

              precision    recall  f1-score   support

           0       0.95      0.96      0.95       295
           1       0.96      0.95      0.95       305

    accuracy                           0.95       600
   macro avg       0.95      0.95      0.95       600
weighted avg       0.95      0.95      0.95       600

Implementación de Backprop con gráficas computacionales

Algoritmo para aprendizaje en red neuronal

Gráfica computacional

Nodos para pre-activaciones

Nodo para función de activación

Nodo para capa de salida

Nodo de la función de riesgo

Aplicación a un problema concreto

Creación de gráfica

Entrenamiento

Evaluación y visualización del aprendizaje

Regiones de clasificación

PyTorch