Source code for csle_common.models.fnn_w_softmax

"""
An FNN model with softmax output, defined in PyTorch
"""
import torch


class FNNwithSoftmax(torch.nn.Module):
    """
    Implements an FNN with a parameterizable number of layers, dimensions, and hidden activations.

    Sub-classes torch.nn.Module to be able to use the high-level API for creating custom networks
    """

    def __init__(self, input_dim: int, output_dim: int, hidden_dim: int, num_hidden_layers: int = 2,
                 hidden_activation: str = "ReLU"):
        """
        Builds the model

        :param input_dim: the input dimension
        :param output_dim: the output dimension
        :param hidden_dim: the hidden dimension
        :param num_hidden_layers: the number of hidden layers
        :param hidden_activation: the hidden activation type
        """
        super(FNNwithSoftmax, self).__init__()
        self.input_dim = input_dim
        self.output_dim = output_dim
        self.hidden_dim = hidden_dim
        self.num_hidden_layers = num_hidden_layers
        self.num_layers = num_hidden_layers + 2
        self.hidden_activation = hidden_activation

        # Define the layers of the FNN
        self.layers = torch.nn.ModuleList()

        # Input layer
        self.layers.append(torch.nn.Linear(input_dim, hidden_dim))
        self.layers.append(self.get_hidden_activation())

        # Hidden layers
        for _ in range(self.num_hidden_layers):
            self.layers.append(torch.nn.Linear(hidden_dim, hidden_dim))
            self.layers.append(self.get_hidden_activation())

        # Output layer; dim=-1 applies the softmax over the output features
        self.layers.append(torch.nn.Linear(hidden_dim, self.output_dim))
        self.layers.append(torch.nn.Softmax(dim=-1))
    def get_hidden_activation(self) -> torch.nn.Module:
        """
        Interprets the hidden activation

        :return: the hidden activation function
        """
        if self.hidden_activation == "ReLU":
            return torch.nn.ReLU()
        elif self.hidden_activation == "LeakyReLU":
            return torch.nn.LeakyReLU()
        elif self.hidden_activation == "LogSigmoid":
            return torch.nn.LogSigmoid()
        elif self.hidden_activation == "PReLU":
            return torch.nn.PReLU()
        elif self.hidden_activation == "Sigmoid":
            return torch.nn.Sigmoid()
        elif self.hidden_activation == "Softplus":
            return torch.nn.Softplus()
        elif self.hidden_activation == "Tanh":
            return torch.nn.Tanh()
        else:
            raise ValueError("Activation type: {} not recognized".format(self.hidden_activation))
    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Forward propagation

        :param x: the input tensor
        :return: the output prediction
        """
        y = x
        for layer in self.layers:
            y = layer(y)
        return y
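
def usage_example() -> None:
    """
    A minimal usage sketch (illustrative, not part of the original module): builds a small
    model with hypothetical dimensions and checks that the forward pass returns a valid
    probability distribution, i.e. that each output row sums to 1.

    :return: None
    """
    # Hypothetical dimensions, chosen only for illustration
    model = FNNwithSoftmax(input_dim=10, output_dim=4, hidden_dim=32, num_hidden_layers=2,
                           hidden_activation="Tanh")
    x = torch.randn(8, 10)
    probs = model(x)
    assert probs.shape == (8, 4)
    # The softmax output layer guarantees each row is a probability distribution
    assert torch.allclose(probs.sum(dim=-1), torch.ones(8))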
def test() -> None:
    """
    A basic test-case to verify that the model can fit some randomly generated data

    :return: None
    """
    # Constants
    input_dim = 44
    output_dim = 44
    hidden_dim = 64
    batch_size = 64

    # Create the model
    model = FNNwithSoftmax(input_dim, output_dim, hidden_dim, num_hidden_layers=2)

    # Create random tensors to hold inputs and outputs
    x = torch.randn(batch_size, input_dim)
    y = torch.empty(batch_size, dtype=torch.long).random_(output_dim)

    # Construct the loss function and the optimizer. The call to model.parameters()
    # in the SGD constructor includes the learnable parameters of all layers in the model.
    # Since the model already outputs softmax probabilities, NLLLoss is applied to the
    # log-probabilities; CrossEntropyLoss would apply a second log-softmax internally.
    criterion = torch.nn.NLLLoss(reduction='sum')
    optimizer = torch.optim.SGD(model.parameters(), lr=1e-4)

    for t in range(20000):
        # Forward pass: compute the predicted y by passing x to the model
        y_pred = model(x)

        # Compute and periodically print the loss
        loss = criterion(torch.log(y_pred), y)
        if t % 100 == 99:
            print("step: {}, loss: {}".format(t, loss.item()))

        # Zero the gradients, perform a backward pass, and update the weights
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()
if __name__ == '__main__':
    test()