Overview

Pruning is an effective way to reduce the size of neural networks by removing parameters from large weight matrices.

We can visualize each of the filter weights for a whole layer with matshow.
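As a minimal sketch (assuming a small, hypothetical `Conv2d` layer created just for this purpose), each filter can be rendered as its own heatmap:

```python
import torch
import torch.nn as nn
import matplotlib.pyplot as plt

# A small convolutional layer used purely for illustration.
torch.manual_seed(0)
conv = nn.Conv2d(in_channels=1, out_channels=6, kernel_size=3)

# Plot each 3x3 filter in the layer as its own heatmap.
fig, axes = plt.subplots(1, conv.out_channels, figsize=(12, 2))
for i, ax in enumerate(axes):
    ax.matshow(conv.weight[i, 0].detach().numpy(), cmap="viridis")
    ax.set_title(f"filter {i}")
    ax.set_xticks([])
    ax.set_yticks([])
plt.show()
```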

We can then prune the weights with any of several PyTorch strategies. The granularity of pruning can be unstructured or structured: unstructured methods mask individual weights (connections), while structured methods mask entire neurons, channels, or layers. Removing entire rows, columns, or blocks from a layer's weight matrix can be effective at reducing computational cost, since the smaller dense weight matrix can be leveraged for hardware optimizations; this is harder to achieve with the sparse matrices produced by unstructured masking. However, unstructured masking tends to yield networks that generalize better as the number of masked parameters increases.

\begin{align} \hat{W}_{uns} &= \begin{bmatrix} w_{11} & w_{12} & 0 & w_{14} \\ 0 & w_{22} & 0 & 0 \\ w_{31} & 0 & 0 & w_{34} \\ 0 & 0 & w_{43} & w_{44} \end{bmatrix} \\[0.1in] \hat{W}_{str} &= \begin{bmatrix} w_{11} & w_{12} & w_{13} & w_{14} \\ 0 & 0 & 0 & 0 \\ w_{31} & w_{32} & w_{33} & w_{34} \\ 0 & 0 & 0 & 0 \end{bmatrix} \end{align}
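A rough sketch of how masks with these two patterns might be produced with `torch.nn.utils.prune`; the 4x4 `Linear` layers, the 50% amount, and the L1/L2 criteria below are arbitrary choices for illustration:

```python
import torch
import torch.nn as nn
import torch.nn.utils.prune as prune

torch.manual_seed(0)
layer_uns = nn.Linear(4, 4)
layer_str = nn.Linear(4, 4)

# Unstructured: mask the 50% of individual weights with the smallest magnitude.
prune.l1_unstructured(layer_uns, name="weight", amount=0.5)

# Structured: mask the 2 rows (output neurons) with the smallest L2 norm (dim=0).
prune.ln_structured(layer_str, name="weight", amount=2, n=2, dim=0)

print(layer_uns.weight_mask)  # scattered zeros, like the unstructured pattern above
print(layer_str.weight_mask)  # entire rows zeroed, like the structured pattern above
```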

Pruning in PyTorch works by adding extra computation to the given module. The original weight matrix is copied to a new parameter named weight_orig, and the pruned subnetwork is represented by a binary buffer weight_mask, where a value of 1 means the corresponding parameter is retained. The effective weight is the element-wise product of weight_orig and weight_mask; it is applied automatically and exposed as module.weight, recomputed before each forward pass by a forward pre-hook registered on the module.
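For instance, after applying a hypothetical unstructured pruning step, this reparametrization can be inspected directly (the layer and pruning amount below are placeholders):

```python
import torch
import torch.nn as nn
import torch.nn.utils.prune as prune

layer = nn.Linear(4, 4)  # hypothetical layer for illustration
prune.l1_unstructured(layer, name="weight", amount=0.5)

# The original tensor now lives in the parameter weight_orig,
# and the binary mask lives in the buffer weight_mask.
print([n for n, _ in layer.named_parameters()])  # ['bias', 'weight_orig']
print([n for n, _ in layer.named_buffers()])     # ['weight_mask']

# module.weight is recomputed as weight_orig * weight_mask by a
# forward pre-hook before every forward pass.
print(torch.equal(layer.weight, layer.weight_orig * layer.weight_mask))  # True
print(layer._forward_pre_hooks)  # shows the registered pruning hook
```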

Now let's reset the pruned module and demonstrate how structured methods operate over different dimensions.
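A minimal sketch of what that might look like, assuming fresh `Linear` layers and pruning along the output dimension (dim=0) versus the input dimension (dim=1):

```python
import torch.nn as nn
import torch.nn.utils.prune as prune

# Fresh, unpruned layers so each example starts from a clean state.
rows = nn.Linear(4, 4)
cols = nn.Linear(4, 4)

# dim=0 prunes entire output neurons (rows of the weight matrix).
prune.ln_structured(rows, name="weight", amount=2, n=2, dim=0)

# dim=1 prunes entire input connections (columns of the weight matrix).
prune.ln_structured(cols, name="weight", amount=2, n=2, dim=1)

print(rows.weight_mask)  # zeroed rows
print(cols.weight_mask)  # zeroed columns
```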