Source code for autoqild.mi_estimators.neural_networks_torch

"""Neural network implementations for running the PC-softmax and MINE MI
estimators."""

import torch
import torch.nn.functional as F
from torch import nn

from autoqild.mi_estimators.pytorch_utils import own_softmax



[docs]
class ClassNet(nn.Module):
    """Fully connected feedforward network used for classification tasks.

    The network is ``input -> (n_hidden - 1) hidden layers -> output`` with a
    ReLU after the input layer and after every hidden layer.  The final layer
    can optionally be passed through the project's custom softmax
    (``own_softmax``, "PC-softmax") instead of the standard softmax.

    Parameters
    ----------
    in_dim : int
        Number of input features.
    out_dim : int
        Number of output classes.
    n_units : int
        Number of units in each hidden layer.
    n_hidden : int
        Number of hidden layers.  ``n_hidden - 1`` square ``n_units x n_units``
        layers are created in addition to the input layer; values ``<= 1``
        yield no extra hidden layers.
    device : torch.device
        Device handed to ``own_softmax``.  The constructor does not move the
        layers to this device; callers move the module with ``.to(device)``.
    is_pc_softmax : bool, optional, default=True
        If True, use the custom PC-softmax function in the final layer
        (only when label proportions are supplied to ``forward``).

    Attributes
    ----------
    input : torch.nn.Linear
        Input layer.
    hidden_layers : torch.nn.ModuleList of torch.nn.Linear
        Hidden layers.
    output : torch.nn.Linear
        Output layer.
    is_pc_softmax : bool
        Whether to use the PC-softmax function.
    device : torch.device
        Device used for computation.
    """

    def __init__(self, in_dim, out_dim, n_units, n_hidden, device, is_pc_softmax=True):
        super().__init__()
        self.input = nn.Linear(in_dim, n_units)
        # A ModuleList (not a plain list) is required so the hidden layers are
        # registered as sub-modules: only then do they show up in
        # ``parameters()`` / ``state_dict()`` and follow ``.to(device)``.
        self.hidden_layers = nn.ModuleList(
            [nn.Linear(n_units, n_units) for _ in range(n_hidden - 1)]
        )
        self.output = nn.Linear(n_units, out_dim)
        self.is_pc_softmax = is_pc_softmax
        self.device = device

    def _logits(self, x_in):
        """Run the shared trunk and return the raw output-layer activations."""
        x_in = torch.relu(self.input(x_in))
        for hidden in self.hidden_layers:
            x_in = torch.relu(hidden(x_in))
        return self.output(x_in)

    def forward(self, x_in, label_proportions):
        """Forward pass through the network.

        Parameters
        ----------
        x_in : torch.Tensor
            Input tensor.
        label_proportions : list or torch.Tensor or None
            Proportions of each class in the dataset.  When ``None`` (or when
            ``is_pc_softmax`` is False) the standard softmax over ``dim=1``
            is used instead of ``own_softmax``.

        Returns
        -------
        x_in : torch.Tensor
            Logarithm of the (PC-)softmax output; ``1e-6`` is added before the
            log to avoid ``log(0)``.
        """
        logits = self._logits(x_in)
        if label_proportions is not None and self.is_pc_softmax:
            probs = own_softmax(logits, label_proportions, self.device)
        else:
            probs = F.softmax(logits, dim=1)
        return torch.log(probs + 1e-6)

    def score(self, x_in, label_proportions):
        """Compute class probabilities for the input samples.

        Parameters
        ----------
        x_in : torch.Tensor
            Input tensor.
        label_proportions : list or torch.Tensor
            Proportions of each class in the dataset.  Accepted for interface
            symmetry with ``forward``; it is not used here.

        Returns
        -------
        x_in : torch.Tensor
            Output tensor with class probabilities (standard softmax over
            ``dim=1``).
        """
        return F.softmax(self._logits(x_in), dim=1)





[docs]
class StatNet(nn.Module):
    """Fully connected feedforward network used as the statistics network in
    MINE (Mutual Information Neural Estimation).

    The network is ``input -> (n_hidden - 1) hidden layers -> output`` with a
    ReLU after the input layer and after every hidden layer, and a single
    scalar output unit.  The input layer expects ``in_dim + cls_enc`` features.

    Parameters
    ----------
    in_dim : int
        Number of input features.
    cls_enc : int, optional, default=1
        Number of classes in the one-hot encoded target variable.
    n_units : int, optional, default=100
        Number of units in each hidden layer.
    n_hidden : int, optional, default=1
        Number of hidden layers.  ``n_hidden - 1`` square ``n_units x n_units``
        layers are created in addition to the input layer; values ``<= 1``
        yield no extra hidden layers.
    device : torch.device, optional, default=`cpu`
        Device to run the network on (CPU or GPU).  All layers are moved to
        this device at construction time.

    Attributes
    ----------
    device : torch.device or str
        Device the layers live on and inputs are moved to.
    input : torch.nn.Linear
        Input layer.
    hidden_layers : torch.nn.ModuleList of torch.nn.Linear
        Hidden layers.
    output : torch.nn.Linear
        Output layer.
    """

    def __init__(self, in_dim, cls_enc=1, n_units=100, n_hidden=1, device="cpu"):
        super().__init__()
        self.device = device
        self.input = nn.Linear(in_dim + cls_enc, n_units).to(self.device)
        # A ModuleList (not a plain list) is required so the hidden layers are
        # registered as sub-modules: only then do they show up in
        # ``parameters()`` (and get optimized) and in ``state_dict()``.
        self.hidden_layers = nn.ModuleList(
            [nn.Linear(n_units, n_units) for _ in range(n_hidden - 1)]
        ).to(self.device)
        self.output = nn.Linear(n_units, 1).to(self.device)

    def forward(self, x_in):
        """Forward pass through the network.

        Parameters
        ----------
        x_in : torch.Tensor
            Input tensor; it is moved to ``self.device`` before use.

        Returns
        -------
        x_in : torch.Tensor
            Output tensor after applying the network layers (one value per
            input row, no final activation).
        """
        x_in = x_in.to(self.device)
        x_in = torch.relu(self.input(x_in))
        for hidden in self.hidden_layers:
            x_in = torch.relu(hidden(x_in))
        return self.output(x_in)