Commit
* add networks
* add networks plus tests
* consistent order
* fix coverage
* bump version to 0.5.0
* Update network.py: remove rollback gubbins
* factor fit onto model
* formatting
* bump version to 0.6.0
* Comments removed, docstrings updated, code neater
* some network tweaks
* formatting

---------

Co-authored-by: Will Handley <[email protected]>
1 parent 4aeee8f · commit 1d986fc
Showing 5 changed files with 301 additions and 3 deletions.
Version bump:

```diff
@@ -1 +1 @@
-__version__ = '0.5.1'
+__version__ = '0.6.0'
```
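Note that `pyproject.toml` declares `dynamic = ["version"]` (visible in the diff further down), so this one-line version file is the single source of truth for the release number.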
New file `lsbi/network.py` (196 additions):

```python
"""Simple binary classifiers to perform model comparison.""" | ||
import torch | ||
import torch.nn as nn | ||
import torch.optim as optim | ||
from torch.optim.lr_scheduler import ExponentialLR | ||
|
||
|
||
class BinaryClassifierBase(nn.Module):
    """Base model for binary classification. Following arXiv:2305.11241.

    A simple binary classifier:
        - 5 hidden layers
        - Layer 1 with initial_dim units
        - Layers 2-5 with internal_dim units
        - Leaky ReLU activation function
        - Batch normalization
        - Output layer with a single linear unit
        - Adam optimizer with default learning rate 0.001
        - Exponential learning rate decay with default decay rate 0.95

    Parameters
    ----------
    input_dim : int
        Dimension of the input data.
    internal_dim : int, optional (default=16)
        Dimension of the internal layers of the network.
    initial_dim : int, optional (default=130)
        Dimension of the first layer of the network.
    """

    def __init__(self, input_dim, internal_dim=16, initial_dim=130):
        super(BinaryClassifierBase, self).__init__()

        self.model = nn.Sequential(
            nn.Linear(input_dim, initial_dim),
            nn.LeakyReLU(),
            nn.BatchNorm1d(initial_dim),
            nn.Linear(initial_dim, internal_dim),
            nn.LeakyReLU(),
            nn.BatchNorm1d(internal_dim),
            nn.Linear(internal_dim, internal_dim),
            nn.LeakyReLU(),
            nn.BatchNorm1d(internal_dim),
            nn.Linear(internal_dim, internal_dim),
            nn.LeakyReLU(),
            nn.BatchNorm1d(internal_dim),
            nn.Linear(internal_dim, internal_dim),
            nn.LeakyReLU(),
            nn.Linear(internal_dim, 1),
        )

    def forward(self, x):
        """Forward pass through the network, logit output."""
        return self.model(x)

    def loss(self, x, y):
        """Loss function for the network."""
        raise NotImplementedError

    def predict(self, x):
        """Predict the Bayes factor."""
        raise NotImplementedError

    def fit(self, X, y, **kwargs):
        """Fit classifier on input features X to predict labels y.

        Parameters
        ----------
        X : array-like, shape (n_samples, n_features)
            Input data.
        y : array-like, shape (n_samples,)
            Target values.
        num_epochs : int, optional (default=10)
            Number of epochs to train the network.
        batch_size : int, optional (default=128)
            Batch size for training.
        decay_rate : float, optional (default=0.95)
            Decay rate for the learning rate scheduler.
        lr : float, optional (default=0.001)
            Learning rate for the optimizer.
        device : str, optional (default="cpu")
            Device to use for training.
        """
        num_epochs = kwargs.get("num_epochs", 10)
        batch_size = kwargs.get("batch_size", 128)
        decay_rate = kwargs.get("decay_rate", 0.95)
        lr = kwargs.get("lr", 0.001)
        device = torch.device(kwargs.get("device", "cpu"))

        print("Using device: ", device)

        # Convert data and labels to torch tensors
        X = torch.tensor(X, dtype=torch.float32)
        labels = torch.tensor(y, dtype=torch.float32)
        labels = labels.unsqueeze(1)
        labels = labels.to(device)

        # Create a DataLoader for batch training
        dataset = torch.utils.data.TensorDataset(X, labels)
        dataloader = torch.utils.data.DataLoader(
            dataset, batch_size=batch_size, shuffle=True
        )

        # Define the loss function and optimizer
        criterion = self.loss
        optimizer = optim.Adam(self.parameters(), lr=lr)

        # Create the scheduler and pass in the optimizer and decay rate
        scheduler = ExponentialLR(optimizer, gamma=decay_rate)

        # Move the model to the training device
        self.to(device=device, dtype=torch.float32)

        for epoch in range(num_epochs):
            epoch_loss = []
            for i, (inputs, targets) in enumerate(dataloader):
                # Clear gradients
                optimizer.zero_grad()
                inputs = inputs.to(device)
                # Forward pass
                loss = criterion(inputs, targets)
                epoch_loss.append(loss.item())
                # Backward pass and optimize
                loss.backward()
                optimizer.step()

            # Decay the learning rate and report the mean loss for the epoch
            scheduler.step()
            mean_loss = torch.mean(torch.tensor(epoch_loss)).item()
            print(f"Epoch {epoch+1}/{num_epochs}, Loss: {mean_loss}")

        # once training is done, set the model to eval(); this ensures
        # batchnorm and dropout are not used during inference
        self.model.eval()


class BinaryClassifier(BinaryClassifierBase):
    """
    Extends the BinaryClassifierBase to use a BCE loss function.

    Provides a direct prediction of the log Bayes factor.
    """

    def loss(self, x, y):
        """Binary cross-entropy loss function for the network."""
        y_ = self.forward(x)
        return nn.BCEWithLogitsLoss()(y_, y)

    def predict(self, x):
        """Predict the log Bayes factor.

        log K = ln P(Class 1) - ln P(Class 0)
        """
        x = torch.tensor(x, dtype=torch.float32)
        pred = self.forward(x)
        pred = nn.Sigmoid()(pred)
        return (torch.log(pred) - torch.log(1 - pred)).detach().numpy()


class BinaryClassifierLPop(BinaryClassifierBase):
    """
    Extends the BinaryClassifierBase to use an LPop exponential loss.

    Provides a direct prediction of the log Bayes factor.

    Parameters
    ----------
    alpha : float, optional (default=2.0)
        Scale factor for the exponent transform.
    """

    def __init__(self, *args, **kwargs):
        self.alpha = kwargs.pop("alpha", 2.0)
        super(BinaryClassifierLPop, self).__init__(*args, **kwargs)

    def lpop(self, x):
        """Leaky parity-odd power transform."""
        return x + x * torch.pow(torch.abs(x), self.alpha - 1.0)

    def loss(self, x, y):
        """LPop loss function for the network."""
        x = self.forward(x)
        return torch.exp(
            torch.logsumexp((0.5 - y) * self.lpop(x), dim=0)
            - torch.log(torch.tensor(x.shape[0], dtype=torch.float64))
        ).squeeze()

    def predict(self, x):
        """Predict the log Bayes factor.

        log K = ln P(Class 1) - ln P(Class 0)
        """
        x = torch.tensor(x, dtype=torch.float32)
        pred = self.forward(x)
        pred = self.lpop(pred)
        return pred.detach().numpy()
```
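For reference, the LPop loss above averages exp((1/2 − y) · f_α(x)) over the batch, where f_α(x) = x + x·|x|^(α−1) is the leaky parity-odd power transform of the logits, evaluated via a logsumexp for numerical stability. A minimal usage sketch of the `BinaryClassifier` API on synthetic data (the toy data and hyperparameter choices here are illustrative assumptions, not part of the commit):

```python
import numpy as np

from lsbi.network import BinaryClassifier

# Hypothetical toy two-class problem: class-1 samples are shifted
# relative to class 0 (any (n_samples, n_features) arrays would do).
rng = np.random.default_rng(0)
X = np.vstack([
    rng.normal(0.0, 1.0, size=(500, 4)),   # class 0
    rng.normal(0.5, 1.0, size=(500, 4)),   # class 1
])
y = np.concatenate([np.zeros(500), np.ones(500)])

model = BinaryClassifier(input_dim=4)
model.fit(X, y, num_epochs=5, lr=0.001)

# predict returns the per-sample log Bayes factor,
# log K = ln P(Class 1) - ln P(Class 0)
log_K = model.predict(X)
print(log_K.shape)  # (1000, 1)
```

`BinaryClassifierLPop` is used identically, with the extra `alpha` keyword at construction.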
Changes to `pyproject.toml` (new author and the `torch` dependency):

```diff
@@ -7,6 +7,7 @@ name = "lsbi"
 dynamic = ["version"]
 authors = [
     { name="Will Handley", email="[email protected]" },
+    { name="David Yallup", email="[email protected]" },
 ]
 description = "Linear Simulation Based Inference"
 readme = "README.rst"
@@ -16,6 +17,7 @@ dependencies = [
     'numpy',
     'scipy',
     'matplotlib',
+    'torch',
 ]
 classifiers = [
     "Programming Language :: Python :: 3",
```
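Since `torch` is now a runtime dependency, a fresh install (e.g. `pip install lsbi`, or `pip install -e .` from a checkout) should pull in PyTorch automatically, so `from lsbi.network import BinaryClassifier` works without extra setup.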
New test file (100 additions):

```python
from lsbi.network import (
    BinaryClassifierBase,
    BinaryClassifier,
    BinaryClassifierLPop,
)
import torch
import numpy as np
import pytest


@pytest.mark.parametrize("input_dim", [1, 100]) | ||
@pytest.mark.parametrize("internal_dim", [16, 32]) | ||
@pytest.mark.parametrize("initial_dim", [130, 256]) | ||
class TestClassifierBase: | ||
CLS = BinaryClassifierBase | ||
|
||
@pytest.fixture | ||
def model(self, input_dim, internal_dim, initial_dim): | ||
return self.CLS(input_dim, internal_dim, initial_dim) | ||
|
||
@pytest.fixture | ||
def x(self, input_dim): | ||
return torch.tensor(np.random.rand(10, input_dim), dtype=torch.float32) | ||
|
||
@pytest.fixture | ||
def y(self): | ||
return torch.tensor( | ||
np.random.randint(0, 2, size=(10, 1)), dtype=torch.float32 | ||
) | ||
|
||
def fit_model(self, model, input_dim): | ||
data_size = 10 | ||
data = np.random.rand(data_size, input_dim) | ||
labels = np.random.randint(0, 2, size=(data_size)) | ||
y_start = model.predict(data) | ||
model.fit(data, labels, num_epochs=1) | ||
y_end = model.predict(data) | ||
return y_start, y_end | ||
|
||
def test_init(self, model): | ||
assert isinstance(model, BinaryClassifierBase) | ||
|
||
def test_forward(self, model, x): | ||
y = model.forward(x) | ||
assert y.shape == (10, 1) | ||
|
||
def test_loss(self, model, x, y): | ||
with pytest.raises(NotImplementedError): | ||
model.loss(x, y) | ||
|
||
def test_predict(self, model, x): | ||
with pytest.raises(NotImplementedError): | ||
model.predict(x) | ||
|
||
def test_fit(self, model, x): | ||
with pytest.raises(NotImplementedError): | ||
y_start, y_end = self.fit_model(model, x.shape[1]) | ||
|
||
|
||
class TestClassifier(TestClassifierBase):
    CLS = BinaryClassifier

    def test_loss(self, model, x, y):
        loss = model.loss(x, y)
        assert loss.detach().numpy().shape == ()

    @pytest.mark.filterwarnings("ignore::UserWarning")
    def test_predict(self, model, x):
        y = model.predict(x)
        assert y.shape == (10, 1)
        assert isinstance(y, np.ndarray)

    @pytest.mark.filterwarnings("ignore::UserWarning")
    def test_fit(self, model, x):
        y_start, y_end = self.fit_model(model, x.shape[1])
        assert (y_start != y_end).any()


@pytest.mark.parametrize("alpha", [2, 5]) | ||
class TestClassifierLPop(TestClassifierBase): | ||
CLS = BinaryClassifierLPop | ||
|
||
@pytest.fixture | ||
def model(self, input_dim, internal_dim, initial_dim, alpha): | ||
return self.CLS(input_dim, internal_dim, initial_dim, alpha=alpha) | ||
|
||
def test_loss(self, model, x, y): | ||
loss = model.loss(x, y) | ||
assert loss.detach().numpy().shape == () | ||
|
||
@pytest.mark.filterwarnings("ignore::UserWarning") | ||
def test_predict(self, model, x): | ||
y = model.predict(x) | ||
assert y.shape == (10, 1) | ||
assert isinstance(y, np.ndarray) | ||
|
||
@pytest.mark.filterwarnings("ignore::UserWarning") | ||
def test_fit(self, model, x): | ||
y_start, y_end = self.fit_model(model, x.shape[1]) | ||
assert (y_start != y_end).any() |
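The class-level `parametrize` markers expand each base test across 2 × 2 × 2 combinations of `input_dim`, `internal_dim`, and `initial_dim`, with a further factor of two in `alpha` for the LPop variant. Running `pytest` from the repository root (the exact test-file name is not shown in this diff) should exercise the full matrix.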