import matplotlib.pyplot as plt
import numpy as np
from tqdm import tqdm
from sklearn.datasets import load_digits
from sklearn.model_selection import train_test_split
from node_layers import *


def calculate_target_size(img_size, kernel_size):
    """Return the side length of a valid (no padding, stride 1) convolution output.

    Counts the start offsets ``i`` in ``range(img_size)`` for which a window
    of ``kernel_size`` pixels still fits, i.e. ``i + kernel_size <= img_size``.

    Args:
        img_size: Number of pixels along one side of the input image.
        kernel_size: Number of pixels along one side of the kernel.

    Returns:
        The number of valid window positions; 0 when the kernel is larger
        than the image.
    """
    # Closed form of the counting loop: img_size - kernel_size + 1 positions,
    # clamped to [0, img_size] so degenerate sizes give the same count as
    # enumerating the offsets one by one.
    return max(0, min(img_size, img_size - kernel_size + 1))

def ReLU(x):
    """Apply the rectified linear unit element-wise.

    Args:
        x: NumPy array of any shape.

    Returns:
        Array with the same shape as ``x`` where every negative entry has
        been replaced by 0.
    """
    # Vectorised max(0, x): avoids a Python-level loop over every element
    # and does not require the input to be two-dimensional.
    return np.maximum(x, 0)


class Conv2D():
    """Single-channel 2-D convolution layer (cross-correlation) followed by ReLU.

    The layer slides one square ``kernel`` x ``kernel`` filter over a 2-D
    input with stride 1 and no padding, adds a scalar bias and applies ReLU.

    Attributes set by the forward pass: ``x`` (input), ``k`` (kernel side),
    ``tgt_size`` (number of output rows), ``h`` (pre-activation output).
    Attribute set by the backward pass: ``d`` (gradient with respect to the
    input, same shape as ``x``).
    """
    def __init__(self, kernel):
        # Fixed seed so every instance starts from the same parameters.
        # Note that this reseeds NumPy's global random generator.
        np.random.seed(1)
        # Parameter initialisation: square filter and a single bias
        self.w = np.random.random((kernel, kernel))/np.sqrt(kernel)
        self.b = np.random.random(1)

    def __call__(self, x):
        """Run the forward pass on a 2-D array and return ReLU(w * x + b)."""
        self.x = x
        self.k = self.w.shape[0]
        # Valid cross-correlation: one output per position where the kernel fits
        rows = max(0, x.shape[0] - self.k + 1)
        cols = max(0, x.shape[1] - self.k + 1)
        self.tgt_size = rows
        self.h = np.zeros(shape=(rows, cols))
        # Use the bias as a scalar; assigning a 1-element array into a single
        # cell relies on an array-to-scalar conversion NumPy has deprecated.
        bias = np.ravel(self.b)[0]
        for i in range(rows):
            for j in range(cols):
                patch = x[i:i+self.k, j:j+self.k]
                self.h[i, j] = np.sum(self.w*patch) + bias

        return np.maximum(self.h, 0)

    def _upstream_gradient(self, layer):
        """Return ``layer.d`` expressed on the grid of this layer's output."""
        grad = np.asarray(layer.d, dtype=float)
        if grad.shape == self.h.shape:
            return grad
        # A pooling layer may hand back one value per pooling window; spread
        # each value evenly over its window (the average-pooling rule).
        win_rows = getattr(layer, "K", None)
        win_cols = getattr(layer, "L", None)
        if grad.ndim != 2 or win_rows is None or win_cols is None:
            raise ValueError(
                f"cannot match upstream gradient of shape {grad.shape} "
                f"to convolution output of shape {self.h.shape}"
            )
        spread = np.repeat(np.repeat(grad, win_rows, axis=0), win_cols, axis=1)
        spread = spread/(win_rows*win_cols)
        full = np.zeros_like(self.h)
        # Rows/columns dropped by the pooling layer receive no gradient
        rows = min(full.shape[0], spread.shape[0])
        cols = min(full.shape[1], spread.shape[1])
        full[:rows, :cols] = spread[:rows, :cols]
        return full

    def backward(self, layer, lr=0.1):
        """Update ``w`` and ``b`` by one gradient-descent step.

        Must be called after the forward pass, whose stored input and
        pre-activation are used here.

        Args:
            layer: The next layer; its ``d`` attribute is the gradient of the
                loss with respect to this layer's output. It must either
                have the shape of that output or be a per-window gradient
                from a layer exposing its window size as ``K`` and ``L``.
            lr: Learning rate.

        Raises:
            ValueError: If ``layer.d`` cannot be matched to the output shape.
        """
        # ReLU passes gradient only where the pre-activation was positive
        delta = self._upstream_gradient(layer)*(self.h > 0)
        dw = np.zeros_like(self.w)
        d_input = np.zeros(np.shape(self.x), dtype=float)
        for i in range(delta.shape[0]):
            for j in range(delta.shape[1]):
                g = delta[i, j]
                if g == 0:
                    continue
                # Use the stored input of this sample, never a global array
                dw += g*self.x[i:i+self.k, j:j+self.k]
                d_input[i:i+self.k, j:j+self.k] += g*self.w
        # Apply the update once, after gradients were computed with the old w
        self.w -= lr*dw
        self.b -= lr*delta.sum()
        self.d = d_input


class Pooling():
    """Average pooling over non-overlapping square windows."""
    def __init__(self, size):
        # Square pooling window: same extent along rows (K) and columns (L)
        self.K = size
        self.L = size

    def __call__(self, x):
        """Forward pass: return the mean of each complete K x L window of ``x``."""
        self.x = x
        self.M, self.N = x.shape
        # Number of complete windows per axis; leftover rows/columns are dropped
        self.MK = self.M // self.K
        self.NL = self.N // self.L
        cropped = x[:self.MK*self.K, :self.NL*self.L]
        windows = cropped.reshape(self.MK, self.K, self.NL, self.L)
        # Average inside every window (axes 1 and 3 index within a window)
        self.h = windows.mean(axis=(1, 3))

        return self.h

    def backward(self, layer):
        """Backward pass: store in ``self.d`` an (MK, NL) array built from ``layer.d``."""
        flat_h = self.h.reshape(self.MK*self.NL)
        # NOTE(review): evaluated left to right as (h / MK) * NL, not
        # h / (MK * NL) - confirm which one is intended.
        dh = flat_h/self.MK*self.NL
        # Sum over the entries of layer.d of layer.d[a] * dh, back on the pooled grid
        products = np.outer(layer.d, dh)
        self.d = products.sum(0).reshape(self.MK, self.NL)


# Load the digits dataset once (features and labels in a single call)
x, y = load_digits(return_X_y=True)
# Each sample is a flat vector; view it as an 8x8 image
x = x.reshape(len(x), 8, 8)
# Split into training and evaluation sets (30% held out for evaluation)
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.3)


# Build the network graph: convolution -> pooling -> linear -> softmax,
# with a cross-entropy risk on top
conv, pool = Conv2D(3), Pooling(2)
lin, soft = Linear(9,10), Softmax()
risk = CrossEntropy()
# Hyperparameters
lr, epochs = 0.1, 100
# Accumulated risk of every epoch, plotted after training
total_risk = []
for epoch in tqdm(range(epochs)):
    epoch_loss = 0
    for sample, label in zip(x_train, y_train):
        # Forward pass: the pooled map is flattened to the 9 values fed to the linear layer
        pooled = pool(conv(sample))
        probs = soft(lin(pooled.reshape(9)))
        epoch_loss += risk(label, probs)

        # Backward pass: every layer reads the gradient stored by the layer after it
        risk.backward()
        soft.backward(risk)
        lin.backward(soft, lr=lr)
        pool.backward(lin)
        conv.backward(pool, lr=lr)
    total_risk.append(epoch_loss)

plt.plot(total_risk)

100%|█████████████████████████████████████████| 100/100 [03:39<00:00,  2.19s/it]

[<matplotlib.lines.Line2D at 0x7f8856a031c0>]


from sklearn.metrics import classification_report

def _predict_digit(image):
    """Return the index of the largest softmax output for one 8x8 image."""
    pooled = pool(conv(image))
    return soft(lin(pooled.reshape(9))).argmax()


# Prediction on the test set
y_pred = [_predict_digit(x_i) for x_i in x_test]
# Evaluation
print(classification_report(y_test, y_pred))

              precision    recall  f1-score   support

           0       0.91      1.00      0.95        48
           1       0.83      0.66      0.74        59
           2       0.89      1.00      0.94        62
           3       0.82      0.86      0.84        42
           4       0.90      0.84      0.87        63
           5       0.84      0.66      0.74        64
           6       0.83      0.95      0.88        55
           7       0.80      0.92      0.85        38
           8       0.84      0.73      0.78        51
           9       0.79      0.90      0.84        58

    accuracy                           0.84       540
   macro avg       0.84      0.85      0.84       540
weighted avg       0.84      0.84      0.84       540


def plot_images(images, num=2):
    """Show up to ``num`` images side by side in a single row.

    Args:
        images: Iterable of 2-D arrays to display.
        num: Number of subplot columns to create. If ``images`` holds more
            than ``num`` items the extra ones are not drawn.
    """
    # squeeze=False keeps ``axes`` a 2-D array even when num == 1, where
    # plt.subplots would otherwise return a single, non-iterable Axes.
    _, axes = plt.subplots(nrows=1, ncols=num, figsize=(10, 3), squeeze=False)
    for ax, image in zip(axes[0], images):
        ax.imshow(image, cmap=plt.cm.gray_r, interpolation="nearest")
        
# Show the first four test images, then their convolution outputs,
# then the pooled convolution outputs
samples = x_test[:4]
plot_images(samples, num=4)
plot_images([conv(image) for image in samples], num=4)
plot_images([pool(conv(image)) for image in samples], num=4)

Redes convolucionales

Funciones auxiliares

Capa convolucional

Pooling

Aplicación de la red convolucional

Datos

Entrenamiento

Evaluación

Ejercicio