base_system

`BaseSystem`

Bases: LightningModule

Base class for DL system.

Source code in lightning_boost/systems/base_system.py

class BaseSystem(LightningModule):
    """
    Base class for DL system.

    Concrete systems implement `step`, which maps a batch to a dict of predictions keyed by
    task name. Training, validation and testing all run through `_base_step`, which updates
    and logs the metrics, evaluates and logs the loss functions, and returns the weighted
    total loss.
    """

    def __init__(
        self,
        models: List[BaseModel] | BaseModel,
        loss: List[TaskLoss] | TaskLoss,
        optimizer: OptimizerCallable,
        lr_scheduler: LRSchedulerCallable | None = None,
        lr_scheduling_policy: LRSchedulingPolicy = LRSchedulingPolicy(),
        train_metrics: List[TaskMetric] | TaskMetric | None = None,
        val_metrics: List[TaskMetric] | TaskMetric | None = None,
        test_metrics: List[TaskMetric] | TaskMetric | None = None,
        *args,
        **kwargs,
    ) -> None:
        """
        Initializes DL system.

        Args:
            models (List[BaseModel] | BaseModel): DL model(s).
            loss (List[TaskLoss] | TaskLoss): Loss function(s).
            optimizer (OptimizerCallable): Optimizer.
            lr_scheduler (LRSchedulerCallable | None, optional): Learning rate scheduler. Defaults to None.
            lr_scheduling_policy (LRSchedulingPolicy, optional): Learning rate scheduling policy.
                Only used if `lr_scheduler` is given. Defaults to LRSchedulingPolicy().
            train_metrics (List[TaskMetric] | TaskMetric | None, optional): Metric(s) used for training. Defaults to None.
            val_metrics (List[TaskMetric] | TaskMetric | None, optional): Metric(s) used for validation. Defaults to None.
            test_metrics (List[TaskMetric] | TaskMetric | None, optional): Metric(s) used for testing. Defaults to None.
            *args: Accepted for signature compatibility; not used here.
            **kwargs: Accepted for signature compatibility; not used here.
        """

        # NOTE: the default `LRSchedulingPolicy()` is evaluated once at definition time, so
        # all systems relying on the default share the same policy instance.
        super().__init__()

        self.models = get_models_dict(models)
        self.loss_functions = get_loss_dict(loss)
        self.optimizer = optimizer
        self.lr_scheduler = lr_scheduler
        self.lr_scheduling_policy = lr_scheduling_policy
        self.train_metrics = get_metrics_dict(train_metrics)
        self.val_metrics = get_metrics_dict(val_metrics)
        self.test_metrics = get_metrics_dict(test_metrics)

    def step(self, inputs: Dict[str, Tensor], targets: Dict[str, Tensor]) -> Dict[str, Tensor]:
        """
        Performs a single step in training/validation/testing.

        Args:
            inputs (Dict[str, Tensor]): Inputs.
            targets (Dict[str, Tensor]): Targets.

        Raises:
            NotImplementedError: Needs to be implemented for a concrete DL system.

        Returns:
            Dict[str, Tensor]: Predictions. Every key has to be present in targets as well.
        """

        raise NotImplementedError

    def _log_step_value(self, label: str, value: Any) -> None:
        """
        Logs a metric or loss with the logging settings shared by all modes.

        Args:
            label (str): Name under which the value is logged.
            value (Any): Metric object or loss tensor.
        """

        # step-wise logging only while training, epoch-wise aggregation in every mode
        self.log(
            label,
            value,  # type: ignore
            on_step=self.training,
            on_epoch=True,
            sync_dist=True,
        )

    def _evaluate_task(
        self,
        prefix: str,
        metrics: Any,
        loss_functions: Any,
        y_hat: Tensor,
        y: Tensor,
    ) -> List[Tensor]:
        """
        Updates and logs all metrics, then computes and logs all losses of a single task.

        Args:
            prefix (str): Prefix of the logging labels (mode, optionally preceded by task).
            metrics (Any): Mapping from metric name to metric of the task.
            loss_functions (Any): Mapping from loss name to loss function of the task.
            y_hat (Tensor): Predictions of the task.
            y (Tensor): Targets of the task.

        Returns:
            List[Tensor]: Losses of the task, each multiplied by the weight of its loss function.
        """

        for metric_name, metric in metrics.items():
            metric(y_hat, y)
            self._log_step_value(f"{prefix}_{metric_name}", metric)

        weighted_losses = []
        for loss_name, loss_function in loss_functions.items():
            task_loss = loss_function(y_hat, y)
            # the unweighted loss is logged, the weighted loss enters the total loss
            self._log_step_value(f"{prefix}_{loss_name}", task_loss)
            weighted_losses.append(task_loss * loss_function.weight)

        return weighted_losses

    def _base_step(
        self,
        batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
        batch_idx: int,
        test: bool = False,
    ) -> Tensor:
        """
        Closure function for steps in all modes.

        With more than one prediction, metrics and loss functions are looked up per task and
        logged as `{task}_{mode}_{name}`. With a single prediction, the first entry of the
        loss functions and metrics is used and values are logged as `{mode}_{name}`. The
        weighted total loss is logged as `{mode}_total-loss`.

        Args:
            batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
            batch_idx (int): Batch index in epoch.
            test (bool, optional): Whether testing mode is active. Defaults to False.

        Returns:
            Tensor: Loss.
        """

        inputs, targets = batch_data
        assert not (self.training and test)

        if test:
            mode, metrics = 'test', self.test_metrics
        elif self.training:
            mode, metrics = 'train', self.train_metrics
        else:
            mode, metrics = 'val', self.val_metrics

        predictions = self.step(inputs, targets)

        # all keys in predictions have to be existent in targets
        assert (
            len(set(predictions.keys()) - set(targets.keys())) == 0
        ), "Keys of predictions and targets must match!"

        weighted_losses: List[Tensor] = []
        # with multiple predictions, this also holds for loss_functions and metrics
        if len(predictions) > 1:
            assert (
                len(set(predictions.keys()) - set(self.loss_functions.keys())) == 0
            ), "Keys of predictions and loss functions must match!"
            assert (
                len(set(predictions.keys()) - set(metrics.keys())) == 0
            ), "Keys of predictions and metrics must match!"

            for task in predictions:
                weighted_losses.extend(
                    self._evaluate_task(
                        f"{task}_{mode}",
                        metrics[task],  # type: ignore
                        self.loss_functions[task],  # type: ignore
                        predictions[task],
                        targets[task],
                    )
                )
        else:
            loss_functions = next(iter(self.loss_functions.values()))
            task_metrics = next(iter(metrics.values()))
            # pick the target belonging to the predicted task; targets may hold further
            # keys, so simply taking the first target could pair the wrong tensors
            task, y_hat = next(iter(predictions.items()))
            y = targets[task]
            # there must be at least one loss function
            assert len(loss_functions) > 0, "No loss function specified!"  # type: ignore

            weighted_losses.extend(
                self._evaluate_task(mode, task_metrics, loss_functions, y_hat, y)
            )

        # stacking an empty list fails with an obscure error, so check explicitly
        assert len(weighted_losses) > 0, "No loss function specified!"

        # compute weighted loss over losses
        loss = torch.sum(torch.stack(weighted_losses, dim=0), dim=0)
        self._log_step_value(f"{mode}_total-loss", loss)

        return loss

    def training_step(
        self,
        batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
        batch_idx: int,
    ) -> Tensor:
        """
        Performs step in training mode.

        Args:
            batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
            batch_idx (int): Batch index in epoch.

        Returns:
            Tensor: Loss.
        """

        return self._base_step(batch_data, batch_idx)

    def validation_step(
        self,
        batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
        batch_idx: int,
    ) -> Tensor:
        """
        Performs step in validation mode.

        Args:
            batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
            batch_idx (int): Batch index in epoch.

        Returns:
            Tensor: Loss.
        """

        return self._base_step(batch_data, batch_idx)

    def test_step(
        self,
        batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
        batch_idx: int,
    ) -> Tensor:
        """
        Performs step in testing mode.

        Args:
            batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
            batch_idx (int): Batch index in epoch.

        Returns:
            Tensor: Loss.
        """

        return self._base_step(batch_data, batch_idx, test=True)

    def configure_optimizers(self) -> Dict[str, Any]:
        """
        Configures optimizer and learning rate scheduling.

        Returns:
            Dict[str, Any]: Optimizer under 'optimizer'; if a learning rate scheduler is set,
                additionally the scheduling policy bound to it under 'lr_scheduler'.
        """

        optimizer = self.optimizer(self.parameters())

        if self.lr_scheduler is None:
            return {'optimizer': optimizer}

        lr_scheduler = self.lr_scheduler(optimizer)
        lr_scheduling_policy = self.lr_scheduling_policy.bind_lr_scheduler(lr_scheduler)  # type: ignore

        return {'optimizer': optimizer, 'lr_scheduler': lr_scheduling_policy}

`__init__(models, loss, optimizer, lr_scheduler=None, lr_scheduling_policy=LRSchedulingPolicy(), train_metrics=None, val_metrics=None, test_metrics=None, *args, **kwargs)`

Initializes DL system.

Parameters:

Name	Type	Description	Default
`models`	`List[BaseModel] \| BaseModel`	DL model(s).	required
`loss`	`List[TaskLoss] \| TaskLoss`	Loss function(s).	required
`optimizer`	`OptimizerCallable`	Optimizer.	required
`lr_scheduler`	`LRSchedulerCallable \| None`	Learning rate scheduler. Defaults to None.	`None`
`lr_scheduling_policy`	`LRSchedulingPolicy`	Learning rate scheduling policy. Defaults to `LRSchedulingPolicy()`.	`LRSchedulingPolicy()`
`train_metrics`	`List[TaskMetric] \| TaskMetric \| None`	Metric(s) used for training. Defaults to None.	`None`
`val_metrics`	`List[TaskMetric] \| TaskMetric \| None`	Metric(s) used for validation. Defaults to None.	`None`
`test_metrics`	`List[TaskMetric] \| TaskMetric \| None`	Metric(s) used for testing. Defaults to None.	`None`

Source code in lightning_boost/systems/base_system.py

def __init__(
    self,
    models: List[BaseModel] | BaseModel,
    loss: List[TaskLoss] | TaskLoss,
    optimizer: OptimizerCallable,
    lr_scheduler: LRSchedulerCallable | None = None,
    lr_scheduling_policy: LRSchedulingPolicy = LRSchedulingPolicy(),
    train_metrics: List[TaskMetric] | TaskMetric | None = None,
    val_metrics: List[TaskMetric] | TaskMetric | None = None,
    test_metrics: List[TaskMetric] | TaskMetric | None = None,
    *args,
    **kwargs,
) -> None:
    """
    Initializes DL system.

    Args:
        models (List[BaseModel] | BaseModel): DL model(s).
        loss (List[TaskLoss] | TaskLoss): Loss function(s).
        optimizer (OptimizerCallable): Optimizer.
        lr_scheduler (LRSchedulerCallable | None, optional): Learning rate scheduler. Defaults to None.
        lr_scheduling_policy (LRSchedulingPolicy, optional): Learning rate scheduling policy.
            Only used if `lr_scheduler` is given. Defaults to LRSchedulingPolicy().
        train_metrics (List[TaskMetric] | TaskMetric | None, optional): Metric(s) used for training. Defaults to None.
        val_metrics (List[TaskMetric] | TaskMetric | None, optional): Metric(s) used for validation. Defaults to None.
        test_metrics (List[TaskMetric] | TaskMetric | None, optional): Metric(s) used for testing. Defaults to None.
        *args: Accepted for signature compatibility; not used here.
        **kwargs: Accepted for signature compatibility; not used here.
    """

    # NOTE: the default `LRSchedulingPolicy()` is evaluated once at definition time, so
    # all systems relying on the default share the same policy instance.
    super().__init__()

    # models, losses and metrics are normalized by the get_*_dict helpers; the results are
    # accessed as mappings in `_base_step`
    self.models = get_models_dict(models)
    self.loss_functions = get_loss_dict(loss)
    # optimizer and scheduler are stored as callables and instantiated in `configure_optimizers`
    self.optimizer = optimizer
    self.lr_scheduler = lr_scheduler
    self.lr_scheduling_policy = lr_scheduling_policy
    self.train_metrics = get_metrics_dict(train_metrics)
    self.val_metrics = get_metrics_dict(val_metrics)
    self.test_metrics = get_metrics_dict(test_metrics)

`configure_optimizers()`

Configures optimizer and learning rate scheduling.

Returns:

Type	Description
`Dict[str, Any]`	Optimizer and, if a learning rate scheduler is set, the LR scheduling policy bound to it.

Source code in lightning_boost/systems/base_system.py

def configure_optimizers(self) -> Dict[str, Any]:
    """
    Builds the optimizer and, if requested, the learning rate scheduling setup.

    Returns:
        Dict[str, Any]: Optimizer under 'optimizer'; if a learning rate scheduler is set,
            additionally the scheduling policy bound to it under 'lr_scheduler'.
    """

    config: Dict[str, Any] = {'optimizer': self.optimizer(self.parameters())}

    # without a scheduler, the optimizer alone makes up the configuration
    if self.lr_scheduler is not None:
        scheduler = self.lr_scheduler(config['optimizer'])
        config['lr_scheduler'] = self.lr_scheduling_policy.bind_lr_scheduler(scheduler)  # type: ignore

    return config

`step(inputs, targets)`

Performs a single step in training/validation/testing.

Parameters:

Name	Type	Description	Default
`inputs`	`Dict[str, Tensor]`	Inputs.	required
`targets`	`Dict[str, Tensor]`	Targets.	required

Raises:

Type	Description
`NotImplementedError`	Needs to be implemented for a concrete DL system.

Returns:

Type	Description
`Dict[str, Tensor]`	Predictions.

Source code in lightning_boost/systems/base_system.py

def step(self, inputs: Dict[str, Tensor], targets: Dict[str, Tensor]) -> Dict[str, Tensor]:
    """
    Performs a single step in training/validation/testing.

    This is the hook called by `_base_step` in every mode; the base class provides no
    implementation.

    Args:
        inputs (Dict[str, Tensor]): Inputs.
        targets (Dict[str, Tensor]): Targets.

    Raises:
        NotImplementedError: Needs to be implemented for a concrete DL system.

    Returns:
        Dict[str, Tensor]: Predictions. `_base_step` requires every key to be present in
            targets as well.
    """

    raise NotImplementedError

`test_step(batch_data, batch_idx)`

Performs step in testing mode.

Parameters:

Name	Type	Description	Default
`batch_data`	`Tuple[Dict[str, Tensor], Dict[str, Tensor]]`	Inputs, targets.	required
`batch_idx`	`int`	Batch index in epoch.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	Loss.

Source code in lightning_boost/systems/base_system.py

def test_step(
    self,
    batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
    batch_idx: int,
) -> Tensor:
    """
    Performs step in testing mode.

    Delegates to `_base_step` with `test=True`, which selects the test metrics and the
    'test' logging labels.

    Args:
        batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
        batch_idx (int): Batch index in epoch.

    Returns:
        Tensor: Loss.
    """

    return self._base_step(batch_data, batch_idx, test=True)

`training_step(batch_data, batch_idx)`

Performs step in training mode.

Parameters:

Name	Type	Description	Default
`batch_data`	`Tuple[Dict[str, Tensor], Dict[str, Tensor]]`	Inputs, targets.	required
`batch_idx`	`int`	Batch index in epoch.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	Loss.

Source code in lightning_boost/systems/base_system.py

def training_step(
    self,
    batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
    batch_idx: int,
) -> Tensor:
    """
    Performs step in training mode.

    Delegates to `_base_step`, which selects the training metrics and the 'train' logging
    labels while `self.training` is set.

    Args:
        batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
        batch_idx (int): Batch index in epoch.

    Returns:
        Tensor: Loss.
    """

    return self._base_step(batch_data, batch_idx)

`validation_step(batch_data, batch_idx)`

Performs step in validation mode.

Parameters:

Name	Type	Description	Default
`batch_data`	`Tuple[Dict[str, Tensor], Dict[str, Tensor]]`	Inputs, targets.	required
`batch_idx`	`int`	Batch index in epoch.	required

Returns:

Name	Type	Description
`Tensor`	`Tensor`	Loss.

Source code in lightning_boost/systems/base_system.py

def validation_step(
    self,
    batch_data: Tuple[Dict[str, Tensor], Dict[str, Tensor]],
    batch_idx: int,
) -> Tensor:
    """
    Performs step in validation mode.

    Delegates to `_base_step`, which selects the validation metrics and the 'val' logging
    labels while `self.training` is not set.

    Args:
        batch_data (Tuple[Dict[str, Tensor], Dict[str, Tensor]]): Inputs, targets.
        batch_idx (int): Batch index in epoch.

    Returns:
        Tensor: Loss.
    """

    return self._base_step(batch_data, batch_idx)

base_system

BaseSystem

__init__(models, loss, optimizer, lr_scheduler=None, lr_scheduling_policy=LRSchedulingPolicy(), train_metrics=None, val_metrics=None, test_metrics=None, *args, **kwargs)

configure_optimizers()

step(inputs, targets)

test_step(batch_data, batch_idx)

training_step(batch_data, batch_idx)

validation_step(batch_data, batch_idx)

`BaseSystem`

`__init__(models, loss, optimizer, lr_scheduler=None, lr_scheduling_policy=LRSchedulingPolicy(), train_metrics=None, val_metrics=None, test_metrics=None, *args, **kwargs)`

`configure_optimizers()`

`step(inputs, targets)`

`test_step(batch_data, batch_idx)`

`training_step(batch_data, batch_idx)`

`validation_step(batch_data, batch_idx)`