Source code for qulearn.trainer

from enum import Enum
from typing import Dict, Optional

import torch
from torch import nn

from .qkernel import QKernel
from .types import DataLoader, Logger, Loss, Metric, Model, Optimizer, Parameter, Tensor, Writer


[docs] class EpochType(Enum): """ Enum to denote the type of epoch in the training process. :cvar Train: Indicates the epoch is a training epoch. :cvar Validate: Indicates the epoch is a validation epoch. """ Train = 1 Validate = 2
[docs] class SupervisedTrainer: """ Class to handle the training of a supervised learning model. :param optimizer: The optimizer to be used in the training process. :type optimizer: Optimizer :param loss_fn: The loss function used for optimization. :type loss_fn: Loss :param num_epochs: The number of epochs to train for. :type num_epochs: int :param metrics: A dictionary mapping metric names to the metric functions to be evaluated. Defaults to empty dict. :type metrics: Dict[str, Metric], optional :param writer: An optional writer for logging purposes. Default is None. :type writer: Optional[Writer] :param logger: An optional logger for logging purposes. Default is None. :type logger: Optional[Logger] """ def __init__( self, optimizer: Optimizer, loss_fn: Loss, num_epochs: int, metrics: Dict[str, Metric] = {}, writer: Optional[Writer] = None, logger: Optional[Logger] = None, ) -> None: self.optimizer = optimizer self.loss_fn = loss_fn self.metrics = metrics self.num_epochs = num_epochs self.writer = writer self.logger = logger
[docs] def train(self, model: Model, train_data: DataLoader, valid_data: DataLoader) -> None: """ Train the given model using the provided data loaders. :param model: The model to be trained. :type model: Model :param train_data: The DataLoader for the training data. :type train_data: DataLoader :param valid_data: The DataLoader for the validation data. :type valid_data: DataLoader """ for epoch in range(1, self.num_epochs + 1): self.train_epoch(model, train_data, epoch) self.validate_epoch(model, valid_data, epoch)
[docs] def train_epoch(self, model: Model, train_data: DataLoader, epoch: int = 0) -> None: """ Train the model for one epoch. :param model: The model to be trained. :type model: Model :param train_data: The DataLoader for the training data. :type train_data: DataLoader :param epoch: The current epoch number. Default is 0. :type epoch: int """ epoch_type = EpochType.Train self._epoch(epoch_type, model, train_data, epoch)
[docs] def validate_epoch(self, model: Model, valid_data: DataLoader, epoch: int = 0) -> None: """ Validate the model after an epoch of training. :param model: The model to be validated. :type model: Model :param valid_data: The DataLoader for the validation data. :type valid_data: DataLoader :param epoch: The current epoch number. Default is 0. :type epoch: int """ epoch_type = EpochType.Validate self._epoch(epoch_type, model, valid_data, epoch)
def _epoch(self, epoch_type: EpochType, model: Model, data: DataLoader, epoch: int = 0) -> None: running_loss = 0.0 running_metrics = {} for metric in self.metrics: running_metrics[metric] = 0.0 if epoch_type == EpochType.Train: for inputs, labels in data: self._train_step(model, inputs, labels) for inputs, labels in data: with torch.no_grad(): predicted = model(inputs) loss = self.loss_fn(predicted, labels) running_loss += loss.item() * len(inputs) for metric in self.metrics: metric_val = self.metrics[metric](predicted, labels) running_metrics[metric] += metric_val.item() * len(inputs) running_loss /= float(len(data.dataset)) # type: ignore for metric in self.metrics: running_metrics[metric] /= float(len(data.dataset)) # type: ignore phase = epoch_type.name self._log_metrics(phase, running_loss, running_metrics, epoch) def _train_step(self, model: Model, inputs: Tensor, labels: Tensor) -> None: self.optimizer.zero_grad() predicted = model(inputs) loss = self.loss_fn(predicted, labels) loss.backward() self.optimizer.step() def _log_metrics(self, phase: str, loss: float, metrics: Dict[str, float], epoch: int) -> None: if self.writer is not None: self.writer.add_scalar(f"Loss/{phase}", loss, epoch) for metric_name, metric_value in metrics.items(): self.writer.add_scalar(f"Metrics/{phase}/{metric_name}", metric_value, epoch) if self.logger is not None: metrics_strs = [ f"{metric_name}: {metric_value:.6f}" for metric_name, metric_value in metrics.items() ] self.logger.info( f"{phase} - Epoch: {epoch}, Loss: {loss:.6f}, Metrics: {', '.join(metrics_strs)}" )
[docs] class RidgeRegression: """ Class to handle the training of a model using Ridge Regression. :param lambda_reg: Regularization strength. Must be positive. :type lambda_reg: float :param metrics: A dictionary mapping metric names to the metric functions to be evaluated. Defaults to empty dict. :type metrics: Dict[str, Metric], optional :param logger: An optional logger for logging purposes. Default is None. :type logger: Optional[Logger] """ def __init__( self, lambda_reg: float, metrics: Dict[str, Metric] = {}, logger: Optional[Logger] = None, ) -> None: self.lambda_reg = lambda_reg self.metrics = metrics self.logger = logger
[docs] def train(self, model: QKernel, train_data: DataLoader, valid_data: DataLoader) -> None: """ Train the given model using the provided data loaders using Ridge Regression. :param model: The quantum kernel model to be trained. :type model: QKernel :param train_data: The DataLoader for the training data. :type train_data: DataLoader :param valid_data: The DataLoader for the validation data. :type valid_data: DataLoader .. warning:: Training changes the state of the model by assigning `X_train`. """ if len(train_data) != 1: raise ValueError("For ridge regression batching training data is invalid") if len(valid_data) != 1: raise ValueError("For ridge regression batching validation data is invalid") for inputs, labels in train_data: model.X_train = inputs alpha = self.kernel_ridge_regression(model, inputs, labels) model.alpha = alpha phase = EpochType.Train.name running_metrics = {} for inputs, labels in train_data: predicted = model(inputs) for metric in self.metrics: running_metrics[metric] = self.metrics[metric](predicted, labels) self._log_metrics(phase, running_metrics) phase = EpochType.Validate.name running_metrics = {} for inputs, labels in valid_data: predicted = model(inputs) for metric in self.metrics: running_metrics[metric] = self.metrics[metric](predicted, labels) self._log_metrics(phase, running_metrics)
[docs] def kernel_ridge_regression(self, model: QKernel, inputs: Tensor, labels: Tensor) -> Parameter: """ Compute Ridge Regression solution for the given inputs and labels using the provided model. :param model: The quantum kernel model. :type model: QKernel :param inputs: Input data tensor. :type inputs: Tensor :param labels: Corresponding labels tensor. :type labels: Tensor :return: The computed alpha parameter tensor. :rtype: Parameter """ linputs = len(inputs.shape) if linputs != 2: raise ValueError(f"Inputs must have 2 dimensions each, not {linputs}") K = model.kernel_matrix(inputs, inputs) num_samples = inputs.shape[0] Id = torch.eye(num_samples, dtype=labels.dtype, device=labels.device) M = K + self.lambda_reg * Id alpha = nn.Parameter(torch.linalg.solve(M, labels)) return alpha
[docs] def _log_metrics(self, phase: str, metrics: Dict[str, float]) -> None: """ Log computed metrics for the provided phase. :param phase: The phase (train or validate) being logged. :type phase: str :param metrics: Dictionary of computed metrics. :type metrics: Dict[str, float] """ if self.logger is not None: metrics_strs = [ f"{metric_name}: {metric_value:.6f}" for metric_name, metric_value in metrics.items() ] self.logger.info(f"{phase} - Metrics: {', '.join(metrics_strs)}")