
MNIST module

Simple MNIST model.

MNISTLitModule #

Bases: LightningModule

Example of a LightningModule for MNIST classification.

A LightningModule implements 7 key methods:

def __init__(self):
    # Define initialization code here.

def setup(self, stage):
    # Things to set up before each stage: 'fit', 'validate', 'test', 'predict'.
    # This hook is called on every process when using DDP.

def training_step(self, batch, batch_idx):
    # The complete training step.

def validation_step(self, batch, batch_idx):
    # The complete validation step.

def test_step(self, batch, batch_idx):
    # The complete test step.

def predict_step(self, batch, batch_idx):
    # The complete predict step.

def configure_optimizers(self):
    # Define and configure optimizers and LR schedulers.
Docs

https://lightning.ai/docs/pytorch/latest/common/lightning_module.html
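
As a quick orientation (not part of the generated reference itself), here is a minimal usage sketch. The toy `net`, the `functools.partial` factories, and the `lightning.Trainer` import are illustrative assumptions, not defaults shipped with this module:

```python
from functools import partial

import torch
from lightning import Trainer  # or: from pytorch_lightning import Trainer

from src.models.mnist_module import MNISTLitModule

# Toy network for illustration only; any module mapping (B, 1, 28, 28) -> (B, 10) works.
net = torch.nn.Sequential(
    torch.nn.Flatten(),
    torch.nn.Linear(28 * 28, 128),
    torch.nn.ReLU(),
    torch.nn.Linear(128, 10),
)

model = MNISTLitModule(
    net=net,
    # optimizer/scheduler are passed as callables (e.g. partials);
    # configure_optimizers() calls them with the parameters / optimizer later.
    optimizer=partial(torch.optim.Adam, lr=1e-3),
    scheduler=partial(torch.optim.lr_scheduler.ReduceLROnPlateau, mode="min"),
    compile_model=False,
)

trainer = Trainer(max_epochs=1)
# trainer.fit(model, datamodule=...)  # supply an MNIST LightningDataModule here
```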

Source code in src/models/mnist_module.py
class MNISTLitModule(LightningModule):
    """Example of a `LightningModule` for MNIST classification.

    A `LightningModule` implements 7 key methods:

    ```python
    def __init__(self):
        # Define initialization code here.

    def setup(self, stage):
        # Things to set up before each stage: 'fit', 'validate', 'test', 'predict'.
        # This hook is called on every process when using DDP.

    def training_step(self, batch, batch_idx):
        # The complete training step.

    def validation_step(self, batch, batch_idx):
        # The complete validation step.

    def test_step(self, batch, batch_idx):
        # The complete test step.

    def predict_step(self, batch, batch_idx):
        # The complete predict step.

    def configure_optimizers(self):
        # Define and configure optimizers and LR schedulers.
    ```

    Docs:
        https://lightning.ai/docs/pytorch/latest/common/lightning_module.html
    """

    def __init__(
        self,
        net: torch.nn.Module,
        optimizer: torch.optim.Optimizer,
        scheduler: torch.optim.lr_scheduler,
        compile_model: bool,
    ) -> None:
        """Initialize a `MNISTLitModule`.

        Args:
            net: The model to train.
            optimizer: The optimizer to use for training.
            scheduler: The learning rate scheduler to use for training.
            compile_model: Whether or not to compile the model.
        """
        super().__init__()

        # this line allows access to init params via the 'self.hparams' attribute
        # and also ensures init params are stored in the checkpoint
        self.save_hyperparameters(logger=False)

        self.net = net

        # loss function
        self.criterion = torch.nn.CrossEntropyLoss()

        # metric objects for calculating and averaging accuracy across batches
        self.train_acc = Accuracy(task="multiclass", num_classes=10)
        self.val_acc = Accuracy(task="multiclass", num_classes=10)
        self.test_acc = Accuracy(task="multiclass", num_classes=10)

        # for averaging loss across batches
        self.train_loss = MeanMetric()
        self.val_loss = MeanMetric()
        self.test_loss = MeanMetric()

        # for tracking best so far validation accuracy
        self.val_acc_best = MaxMetric()

    @typechecked
    def forward(self, x: TensorType["batch", 1, 28, 28]) -> TensorType["batch", 10]:  # noqa
        """Perform a forward pass through the model.

        Args:
            x: A tensor of shape (batch_size, 1, 28, 28) representing the MNIST images.

        Returns:
            A tensor of shape (batch_size, 10) representing the logits for each class.
        """
        return self.net(x)

    def on_train_start(self) -> None:
        """Lightning hook that is called when training begins."""
        # by default lightning executes validation step sanity checks before training starts,
        # so it's worth making sure validation metrics don't store results from these checks
        self.val_loss.reset()
        self.val_acc.reset()
        self.val_acc_best.reset()

    @typechecked
    def model_step(self, x: TensorType["batch", 1, 28, 28], y: TensorType["batch"]):  # noqa
        """Perform a single model step.

        Args:
            x: Tensor of shape [batch, 1, 28, 28] representing the images.
            y: Tensor of shape [batch] representing the classes.

        Returns:
            A tuple containing:
                - loss: A scalar loss tensor (averaged over the batch)
                - preds: A tensor of predicted class indices (batch_size,)
                - targets: A tensor of true class labels (batch_size,)
        """
        logits = self.forward(x)
        loss = self.criterion(logits, y)
        preds = torch.argmax(logits, dim=1)
        return loss, preds, y

    @typechecked
    def training_step(self, batch: Any) -> TensorType[()]:
        """Perform a single training step.

        Args:
            batch: A tuple containing input images and target labels.

        Returns:
            A scalar loss tensor.
        """
        x, y = batch
        loss, preds, targets = self.model_step(x, y)
        self.train_loss(loss)
        self.train_acc(preds, targets)
        self.log("train/loss", self.train_loss, on_step=False, on_epoch=True, prog_bar=True)
        self.log("train/acc", self.train_acc, on_step=False, on_epoch=True, prog_bar=True)
        return loss

    def on_train_epoch_end(self) -> None:
        """Lightning hook that is called when a training epoch ends."""
        pass

    def validation_step(self, batch: tuple[torch.Tensor, torch.Tensor], batch_idx: int) -> None:
        """Perform a single validation step on a batch of data from the validation set.

        Args:
            batch: A batch of data (a tuple) containing the input tensor of images and target
                labels.
            batch_idx: The index of the current batch.
        """
        x, y = batch
        loss, preds, targets = self.model_step(x, y)

        # update and log metrics
        self.val_loss(loss)
        self.val_acc(preds, targets)
        self.log("val/loss", self.val_loss, on_step=False, on_epoch=True, prog_bar=True)
        self.log("val/acc", self.val_acc, on_step=False, on_epoch=True, prog_bar=True)

    def on_validation_epoch_end(self) -> None:
        """Lightning hook that is called when a validation epoch ends."""
        acc = self.val_acc.compute()  # get current val acc
        self.val_acc_best(acc)  # update best so far val acc
        # log `val_acc_best` as a value through `.compute()` method, instead of as a metric object
        # otherwise metric would be reset by lightning after each epoch
        self.log("val/acc_best", self.val_acc_best.compute(), sync_dist=True, prog_bar=True)

    def test_step(self, batch: tuple[torch.Tensor, torch.Tensor], batch_idx: int) -> None:
        """Perform a single test step on a batch of data from the test set.

        Args:
            batch: A batch of data (a tuple) containing the input tensor of images and target
                labels.
            batch_idx: The index of the current batch.
        """
        x, y = batch
        loss, preds, targets = self.model_step(x, y)

        # update and log metrics
        self.test_loss(loss)
        self.test_acc(preds, targets)
        self.log("test/loss", self.test_loss, on_step=False, on_epoch=True, prog_bar=True)
        self.log("test/acc", self.test_acc, on_step=False, on_epoch=True, prog_bar=True)

    def on_test_epoch_end(self) -> None:
        """Lightning hook that is called when a test epoch ends."""
        pass

    def setup(self, stage: str) -> None:
        """Lightning hook that is called at the beginning of fit (train + validate), validate, test, or predict.

        This is a good hook when you need to build models dynamically or adjust something about
        them. This hook is called on every process when using DDP.

        Args:
            stage: Either `"fit"`, `"validate"`, `"test"`, or `"predict"`.
        """
        if self.hparams.compile_model and stage == "fit":
            self.net = torch.compile(self.net)

    def configure_optimizers(self) -> dict[str, Any]:
        """Choose what optimizers and learning-rate schedulers to use in your optimization.

        Normally you'd need one. But in the case of GANs or similar you might have multiple.

        Examples:
            https://lightning.ai/docs/pytorch/latest/common/lightning_module.html#configure-optimizers

        Returns:
            A dict containing the configured optimizers and learning-rate schedulers to be used for training.
        """
        optimizer = self.hparams.optimizer(params=self.trainer.model.parameters())
        if self.hparams.scheduler is not None:
            scheduler = self.hparams.scheduler(optimizer=optimizer)
            return {
                "optimizer": optimizer,
                "lr_scheduler": {
                    "scheduler": scheduler,
                    "monitor": "val/loss",
                    "interval": "epoch",
                    "frequency": 1,
                },
            }
        return {"optimizer": optimizer}

__init__(net, optimizer, scheduler, compile_model) #

Initialize a MNISTLitModule.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| net | Module | The model to train. | required |
| optimizer | Optimizer | The optimizer to use for training. | required |
| scheduler | lr_scheduler | The learning rate scheduler to use for training. | required |
| compile_model | bool | Whether or not to compile the model. | required |
Source code in src/models/mnist_module.py
def __init__(
    self,
    net: torch.nn.Module,
    optimizer: torch.optim.Optimizer,
    scheduler: torch.optim.lr_scheduler,
    compile_model: bool,
) -> None:
    """Initialize a `MNISTLitModule`.

    Args:
        net: The model to train.
        optimizer: The optimizer to use for training.
        scheduler: The learning rate scheduler to use for training.
        compile_model: Whether or not to compile the model.
    """
    super().__init__()

    # this line allows access to init params via the 'self.hparams' attribute
    # and also ensures init params are stored in the checkpoint
    self.save_hyperparameters(logger=False)

    self.net = net

    # loss function
    self.criterion = torch.nn.CrossEntropyLoss()

    # metric objects for calculating and averaging accuracy across batches
    self.train_acc = Accuracy(task="multiclass", num_classes=10)
    self.val_acc = Accuracy(task="multiclass", num_classes=10)
    self.test_acc = Accuracy(task="multiclass", num_classes=10)

    # for averaging loss across batches
    self.train_loss = MeanMetric()
    self.val_loss = MeanMetric()
    self.test_loss = MeanMetric()

    # for tracking best so far validation accuracy
    self.val_acc_best = MaxMetric()

configure_optimizers() #

Choose what optimizers and learning-rate schedulers to use in your optimization.

Normally you'd need one. But in the case of GANs or similar you might have multiple.

Examples:

https://lightning.ai/docs/pytorch/latest/common/lightning_module.html#configure-optimizers

Returns:

| Type | Description |
| --- | --- |
| dict[str, Any] | A dict containing the configured optimizers and learning-rate schedulers to be used for training. |

Source code in src/models/mnist_module.py
def configure_optimizers(self) -> dict[str, Any]:
    """Choose what optimizers and learning-rate schedulers to use in your optimization.

    Normally you'd need one. But in the case of GANs or similar you might have multiple.

    Examples:
        https://lightning.ai/docs/pytorch/latest/common/lightning_module.html#configure-optimizers

    Returns:
        A dict containing the configured optimizers and learning-rate schedulers to be used for training.
    """
    optimizer = self.hparams.optimizer(params=self.trainer.model.parameters())
    if self.hparams.scheduler is not None:
        scheduler = self.hparams.scheduler(optimizer=optimizer)
        return {
            "optimizer": optimizer,
            "lr_scheduler": {
                "scheduler": scheduler,
                "monitor": "val/loss",
                "interval": "epoch",
                "frequency": 1,
            },
        }
    return {"optimizer": optimizer}

forward(x) #

Perform a forward pass through the model.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| x | TensorType[batch, 1, 28, 28] | A tensor of shape (batch_size, 1, 28, 28) representing the MNIST images. | required |

Returns:

| Type | Description |
| --- | --- |
| TensorType[batch, 10] | A tensor of shape (batch_size, 10) representing the logits for each class. |

Source code in src/models/mnist_module.py
@typechecked
def forward(self, x: TensorType["batch", 1, 28, 28]) -> TensorType["batch", 10]:  # noqa
    """Perform a forward pass through the model.

    Args:
        x: A tensor of shape (batch_size, 1, 28, 28) representing the MNIST images.

    Returns:
        A tensor of shape (batch_size, 10) representing the logits for each class.
    """
    return self.net(x)
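
A small shape check, assuming `model` is an already constructed `MNISTLitModule` (a hypothetical instance, not defined in this file):

```python
import torch

x = torch.randn(32, 1, 28, 28)   # a batch of 32 fake MNIST-sized images
logits = model(x)                # calls forward(); shape (32, 10)
probs = logits.softmax(dim=1)    # per-class probabilities, if needed
```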

model_step(x, y) #

Perform a single model step.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| x | TensorType[batch, 1, 28, 28] | Tensor of shape [batch, 1, 28, 28] representing the images. | required |
| y | TensorType[batch] | Tensor of shape [batch] representing the classes. | required |

Returns:

| Type | Description |
| --- | --- |
| tuple | A tuple containing: loss, a scalar loss tensor averaged over the batch; preds, a tensor of predicted class indices of shape (batch_size,); targets, a tensor of true class labels of shape (batch_size,). |

Source code in src/models/mnist_module.py
@typechecked
def model_step(self, x: TensorType["batch", 1, 28, 28], y: TensorType["batch"]):  # noqa
    """Perform a single model step.

    Args:
        x: Tensor of shape [batch, 1, 28, 28] representing the images.
        y: Tensor of shape [batch] representing the classes.

    Returns:
        A tuple containing:
            - loss: A scalar loss tensor (averaged over the batch)
            - preds: A tensor of predicted class indices (batch_size,)
            - targets: A tensor of true class labels (batch_size,)
    """
    logits = self.forward(x)
    loss = self.criterion(logits, y)
    preds = torch.argmax(logits, dim=1)
    return loss, preds, y
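
For illustration, with a hypothetical `model` instance and random data (CrossEntropyLoss uses mean reduction, so `loss` is a scalar):

```python
import torch

x = torch.randn(8, 1, 28, 28)     # fake images
y = torch.randint(0, 10, (8,))    # fake integer class labels
loss, preds, targets = model.model_step(x, y)
# loss: scalar tensor; preds and targets: shape (8,)
```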

on_test_epoch_end() #

Lightning hook that is called when a test epoch ends.

Source code in src/models/mnist_module.py
def on_test_epoch_end(self) -> None:
    """Lightning hook that is called when a test epoch ends."""
    pass

on_train_epoch_end() #

Lightning hook that is called when a training epoch ends.

Source code in src/models/mnist_module.py
def on_train_epoch_end(self) -> None:
    """Lightning hook that is called when a training epoch ends."""
    pass

on_train_start() #

Lightning hook that is called when training begins.

Source code in src/models/mnist_module.py
def on_train_start(self) -> None:
    """Lightning hook that is called when training begins."""
    # by default lightning executes validation step sanity checks before training starts,
    # so it's worth making sure validation metrics don't store results from these checks
    self.val_loss.reset()
    self.val_acc.reset()
    self.val_acc_best.reset()

on_validation_epoch_end() #

Lightning hook that is called when a validation epoch ends.

Source code in src/models/mnist_module.py
def on_validation_epoch_end(self) -> None:
    """Lightning hook that is called when a validation epoch ends."""
    acc = self.val_acc.compute()  # get current val acc
    self.val_acc_best(acc)  # update best so far val acc
    # log `val_acc_best` as a value through `.compute()` method, instead of as a metric object
    # otherwise metric would be reset by lightning after each epoch
    self.log("val/acc_best", self.val_acc_best.compute(), sync_dist=True, prog_bar=True)

setup(stage) #

Lightning hook that is called at the beginning of fit (train + validate), validate, test, or predict.

This is a good hook when you need to build models dynamically or adjust something about them. This hook is called on every process when using DDP.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| stage | str | Either "fit", "validate", "test", or "predict". | required |
Source code in src/models/mnist_module.py
def setup(self, stage: str) -> None:
    """Lightning hook that is called at the beginning of fit (train + validate), validate, test, or predict.

    This is a good hook when you need to build models dynamically or adjust something about
    them. This hook is called on every process when using DDP.

    Args:
        stage: Either `"fit"`, `"validate"`, `"test"`, or `"predict"`.
    """
    if self.hparams.compile_model and stage == "fit":
        self.net = torch.compile(self.net)
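
Compilation is therefore opt-in via the constructor flag; a minimal sketch, assuming PyTorch 2.x (where `torch.compile` is available) and the hypothetical `net` and factories from the earlier examples:

```python
model = MNISTLitModule(
    net=net,                      # hypothetical network from earlier
    optimizer=optimizer_factory,  # hypothetical factories from earlier
    scheduler=scheduler_factory,
    compile_model=True,           # setup("fit") will wrap self.net with torch.compile
)
# Trainer.fit(...) triggers setup("fit"); validate/test/predict stages leave the net uncompiled.
```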

test_step(batch, batch_idx) #

Perform a single test step on a batch of data from the test set.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| batch | tuple[Tensor, Tensor] | A batch of data (a tuple) containing the input tensor of images and target labels. | required |
| batch_idx | int | The index of the current batch. | required |
Source code in src/models/mnist_module.py
def test_step(self, batch: tuple[torch.Tensor, torch.Tensor], batch_idx: int) -> None:
    """Perform a single test step on a batch of data from the test set.

    Args:
        batch: A batch of data (a tuple) containing the input tensor of images and target
            labels.
        batch_idx: The index of the current batch.
    """
    x, y = batch
    loss, preds, targets = self.model_step(x, y)

    # update and log metrics
    self.test_loss(loss)
    self.test_acc(preds, targets)
    self.log("test/loss", self.test_loss, on_step=False, on_epoch=True, prog_bar=True)
    self.log("test/acc", self.test_acc, on_step=False, on_epoch=True, prog_bar=True)

training_step(batch) #

Perform a single training step.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| batch | Any | A tuple containing input images and target labels. | required |

Returns:

| Type | Description |
| --- | --- |
| TensorType[()] | A scalar loss tensor. |

Source code in src/models/mnist_module.py
@typechecked
def training_step(self, batch: Any) -> TensorType[()]:
    """Perform a single training step.

    Args:
        batch: A tuple containing input images and target labels.

    Returns:
        A scalar loss tensor.
    """
    x, y = batch
    loss, preds, targets = self.model_step(x, y)
    self.train_loss(loss)
    self.train_acc(preds, targets)
    self.log("train/loss", self.train_loss, on_step=False, on_epoch=True, prog_bar=True)
    self.log("train/acc", self.train_acc, on_step=False, on_epoch=True, prog_bar=True)
    return loss

validation_step(batch, batch_idx) #

Perform a single validation step on a batch of data from the validation set.

Parameters:

| Name | Type | Description | Default |
| --- | --- | --- | --- |
| batch | tuple[Tensor, Tensor] | A batch of data (a tuple) containing the input tensor of images and target labels. | required |
| batch_idx | int | The index of the current batch. | required |
Source code in src/models/mnist_module.py
def validation_step(self, batch: tuple[torch.Tensor, torch.Tensor], batch_idx: int) -> None:
    """Perform a single validation step on a batch of data from the validation set.

    Args:
        batch: A batch of data (a tuple) containing the input tensor of images and target
            labels.
        batch_idx: The index of the current batch.
    """
    x, y = batch
    loss, preds, targets = self.model_step(x, y)

    # update and log metrics
    self.val_loss(loss)
    self.val_acc(preds, targets)
    self.log("val/loss", self.val_loss, on_step=False, on_epoch=True, prog_bar=True)
    self.log("val/acc", self.val_acc, on_step=False, on_epoch=True, prog_bar=True)