Module epiclass.core.model_pytorch

Model creation module

Classes

class LightningDenseClassifier (input_size, output_size, mapping, hparams, hl_units=3000, nb_layer=1)

Simple dense network handler

Metrics expect probabilities and not logits
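
A minimal construction sketch. The label mapping, feature size, and hyperparameter values below are illustrative only; the hparams keys match those read in __init__:

mapping = {0: "healthy", 1: "disease"}  # hypothetical label mapping
hparams = {
    "l1_scale": 0.0,  # L1 regularization strength
    "l2_scale": 0.01,  # weight decay passed to Adam
    "keep_prob": 0.5,  # dropout_rate = 1 - keep_prob
    "learning_rate": 1e-5,
}
model = LightningDenseClassifier(
    input_size=1000,  # arbitrary feature count for illustration
    output_size=len(mapping),
    mapping=mapping,
    hparams=hparams,
    hl_units=3000,
    nb_layer=1,
)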

Expand source code
class LightningDenseClassifier(pl.LightningModule):
    """Simple dense network handler"""

    def __init__(
        self, input_size, output_size, mapping, hparams, hl_units=3000, nb_layer=1
    ):
        """Metrics expect probabilities and not logits"""
        super().__init__()
        # save_hyperparameters() is the recommended Lightning way to save
        # model arguments: it stores everything passed to __init__
        # and makes it accessible through self.hparams.<name>
        self.save_hyperparameters()

        # -- general structure --
        self._x_size = input_size
        self._y_size = output_size
        self._hl_size = hl_units  # hl = hidden layer
        self._nb_layer = nb_layer  # number of intermediary/hidden layers
        if self._nb_layer < 1:
            raise AssertionError("Number of layers cannot be less than 1.")

        self._mapping = mapping

        # -- hyperparameters --
        self.l1_scale = hparams.get("l1_scale", 0)
        self.l2_scale = hparams.get("l2_scale", 0.01)
        self.dropout_rate = 1 - hparams.get("keep_prob", 0.5)
        self.learning_rate = hparams.get("learning_rate", 1e-5)

        self._pt_model = self.define_model()

        # -- metrics --
        metrics = MetricCollection(
            [
                Accuracy(num_classes=self._y_size, average="micro"),
                Precision(num_classes=self._y_size, average="macro"),
                Recall(num_classes=self._y_size, average="macro"),
                F1Score(num_classes=self._y_size, average="macro"),
                MatthewsCorrCoef(num_classes=self._y_size),
            ]
        )
        self.metrics = metrics
        self.train_acc = Accuracy(num_classes=self._y_size, average="micro")
        self.valid_acc = Accuracy(num_classes=self._y_size, average="micro")

    @property
    def model(self) -> nn.Module:
        """Return the pytorch model."""
        return self._pt_model

    @property
    def mapping(self) -> Dict[int, str]:
        """Return {output index:label} mapping."""
        return self._mapping

    @property
    def invert_mapping(self) -> Dict[str, int]:
        """Return {label:output index} mapping."""
        return {val: key for key, val in self._mapping.items()}

    # --- Define general model structure ---
    def define_model(self):
        """ref : https://stackoverflow.com/questions/62937388/pytorch-dynamic-amount-of-layers"""
        layer_list = []
        # Think of the layers as matrix operations (the weights), not as the neurons.

        # input layer
        layer_list.append(nn.Dropout(0.1))  # drop part of input
        layer_list.append(nn.Linear(self._x_size, self._hl_size))
        layer_list.append(
            nn.Dropout(self.dropout_rate)
        )  # apply dropout to first hidden layer
        layer_list.append(nn.ReLU())  # ReLU on first hidden layer

        # hidden layers
        for _ in range(self._nb_layer - 1):
            layer_list.append(nn.Linear(self._hl_size, self._hl_size))
            layer_list.append(nn.ReLU())
            # with ReLU, dropout should be applied before the activation for
            # computational efficiency; swapping the two gives the same result
            # https://sebastianraschka.com/faq/docs/dropout-activation.html

        # output layer
        layer_list.append(nn.Linear(self._hl_size, self._y_size))

        # https://pytorch.org/docs/stable/_modules/torch/nn/modules/container.html#Sequential
        model = nn.Sequential(*layer_list)

        return model

    def configure_optimizers(self):
        """https://pytorch.org/docs/stable/optim.html"""
        optimizer = torch.optim.Adam(
            self.parameters(), lr=self.learning_rate, weight_decay=self.l2_scale
        )
        return optimizer

    # --- Define format of output ---
    def forward(self, x: Tensor):
        """Return logits."""
        return self._pt_model(x)

    def predict_proba(self, x: Tensor) -> Tensor:
        """Return probabilities"""
        self.eval()
        with torch.no_grad():
            logits = self(x)
            probs = F.softmax(logits, dim=1)
        return probs

    def predict_class(self, x: Tensor) -> Tensor:
        """Return class"""
        self.eval()
        with torch.no_grad():
            logits = self(x)
            preds = torch.argmax(logits, dim=1)
        return preds

    # --- Define how training and validation is done, what loss is used ---
    def training_step(self, train_batch, batch_idx):
        """Return training loss and co."""
        x, y = train_batch
        logits = self(x)
        loss = F.cross_entropy(logits, y)

        if self.l1_scale > 0:
            # elementwise L1 penalty: sum of absolute values of all parameters
            l1_norm = sum(p.abs().sum() for p in self.parameters())
            loss += self.l1_scale * l1_norm

        preds = torch.argmax(logits, dim=1)
        return {"loss": loss, "preds": preds.detach(), "target": y}

    def training_step_end(self, outputs):  # pylint: disable=arguments-renamed
        """Update and log training metrics."""
        self.train_acc(outputs["preds"], outputs["target"])

        # changing "step" for x-axis change
        metrics = {
            "train_acc": self.train_acc,
            "train_loss": outputs["loss"],
            "step": self.current_epoch + 1.0,
        }
        self.log_dict(metrics, on_step=False, on_epoch=True)

    def validation_step(self, val_batch, batch_idx):
        """Return validation loss and co."""
        x, y = val_batch
        logits = self(x)
        loss = F.cross_entropy(logits, y)
        preds = torch.argmax(logits, dim=1)
        return {"loss": loss, "preds": preds.detach(), "target": y}

    def validation_step_end(self, outputs):
        """Update and log validation metrics."""
        self.valid_acc(outputs["preds"], outputs["target"])

        # changing "step" for x-axis change
        metrics = {
            "valid_acc": self.valid_acc,
            "valid_loss": outputs["loss"],
            "step": self.current_epoch + 1.0,
        }
        self.log_dict(metrics, on_step=False, on_epoch=True, prog_bar=True)

    # --- Other information functions ---
    def print_model_summary(self, batch_size=1):
        """Print torchinfo summary."""
        print("--MODEL SUMMARY--")
        summary(
            model=self,
            input_size=(batch_size, self._x_size),
            col_names=["input_size", "output_size", "num_params"],
        )

    def compute_metrics(self, dataset: TensorDataset):
        """Return dict of metrics for given dataset."""
        self.eval()
        with torch.no_grad():
            features, targets = dataset[:]
            preds = self(features)
        return self.metrics(preds, targets)

    def compute_predictions_from_dataset(
        self, dataset: TensorDataset
    ) -> Tuple[Tensor, Tensor]:
        """Return probability predictions and targets from dataset."""
        self.eval()
        with torch.no_grad():
            features, targets = dataset[:]
            probs = self.predict_proba(features)
        return probs, targets

    def compute_predictions_from_features(self, features: Tensor) -> Tensor:
        """Return probability predictions from features."""
        self.eval()
        with torch.no_grad():
            probs = self.predict_proba(features)
        return probs

    @classmethod
    def restore_model(cls, model_dir, verbose=True):
        """Load the checkpoint of the best model from the last run."""
        path = Path(model_dir) / "best_checkpoint.list"

        if verbose:
            print("Reading checkpoint list and taking last line.")
        with open(path, "r", encoding="utf-8") as ckpt_file:
            lines = ckpt_file.read().splitlines()
            ckpt_path = lines[-1].split(" ")[0]

        if verbose:
            print(f"Loading model from {ckpt_path}")
        return cls.load_from_checkpoint(ckpt_path)
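
Being a LightningModule, the classifier trains with a standard pytorch_lightning Trainer. A hedged sketch reusing the model from the construction example above, on purely synthetic data (shapes and epoch count are illustrative):

import torch
import pytorch_lightning as pl
from torch.utils.data import DataLoader, TensorDataset

# synthetic data for illustration; real features must have input_size columns
x = torch.randn(64, 1000)
y = torch.randint(0, 2, (64,))
train_loader = DataLoader(TensorDataset(x, y), batch_size=32)
valid_loader = DataLoader(TensorDataset(x, y), batch_size=32)

trainer = pl.Trainer(max_epochs=5)
trainer.fit(model, train_loader, valid_loader)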

Ancestors

  • pytorch_lightning.core.module.LightningModule
  • lightning_fabric.utilities.device_dtype_mixin._DeviceDtypeModuleMixin
  • pytorch_lightning.core.mixins.hparams_mixin.HyperparametersMixin
  • pytorch_lightning.core.saving.ModelIO
  • pytorch_lightning.core.hooks.ModelHooks
  • pytorch_lightning.core.hooks.DataHooks
  • pytorch_lightning.core.hooks.CheckpointHooks
  • torch.nn.modules.module.Module

Static methods

def restore_model(model_dir, verbose=True)

Load the checkpoint of the best model from the last run.
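
The method expects model_dir to contain a best_checkpoint.list file; the first space-separated token of its last line is read as the checkpoint path. A usage sketch with a hypothetical directory:

# "logs/last_run" is a hypothetical directory holding best_checkpoint.list
model = LightningDenseClassifier.restore_model("logs/last_run")
model.print_model_summary()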

Instance variables

prop invert_mapping : Dict[str, int]

Return {label:output index} mapping.

Expand source code
@property
def invert_mapping(self) -> Dict[str, int]:
    """Return {label:output index} mapping."""
    return {val: key for key, val in self._mapping.items()}

prop mapping : Dict[int, str]

Return {output index:label} mapping.

Expand source code
@property
def mapping(self) -> Dict[int, str]:
    """Return {output index:label} mapping."""
    return self._mapping

prop model : nn.Module

Return the pytorch model.

Expand source code
@property
def model(self) -> nn.Module:
    """Return the pytorch model."""
    return self._pt_model

Methods

def compute_metrics(self, dataset: TensorDataset)

Return dict of metrics for given dataset.
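
A usage sketch with a synthetic TensorDataset; the feature count must match the model's input_size (1000 in the earlier sketches):

import torch
from torch.utils.data import TensorDataset

features = torch.randn(16, 1000)  # synthetic evaluation features
targets = torch.randint(0, 2, (16,))  # synthetic integer class targets
results = model.compute_metrics(TensorDataset(features, targets))
print(results)  # MetricCollection output: Accuracy, Precision, Recall, ...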

def compute_predictions_from_dataset(self, dataset: TensorDataset) ‑> Tuple[torch.Tensor, torch.Tensor]

Return probability predictions and targets from dataset.

def compute_predictions_from_features(self, features: Tensor) ‑> torch.Tensor

Return probability predictions from features.
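
A minimal sketch; the input tensor is synthetic and its second dimension must equal input_size:

probs = model.compute_predictions_from_features(torch.randn(4, 1000))
print(probs.shape)  # (4, output_size); each row sums to 1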

def configure_optimizers(self)

https://pytorch.org/docs/stable/optim.html

def define_model(self)

ref : https://stackoverflow.com/questions/62937388/pytorch-dynamic-amount-of-layers

def forward(self, x: Tensor) ‑> torch.Tensor

Return logits.

def predict_class(self, x: Tensor) ‑> torch.Tensor

Return predicted class indices.

def predict_proba(self, x: Tensor) ‑> torch.Tensor

Return class probabilities.
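
predict_class returns output indices and predict_proba the corresponding probabilities; the mapping property translates indices back to string labels. A sketch with synthetic input:

probs = model.predict_proba(torch.randn(4, 1000))  # rows sum to 1
preds = probs.argmax(dim=1)  # equivalent to predict_class
labels = [model.mapping[int(i)] for i in preds]  # indices -> string labels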

def print_model_summary(self, batch_size=1)

Print torchinfo summary.

def training_step(self, train_batch, batch_idx)

Return training loss, predictions, and targets.

def training_step_end(self, outputs)

Update and log training metrics.

def validation_step(self, val_batch, batch_idx)

Return validation loss, predictions, and targets.

def validation_step_end(self, outputs)

Update and log validation metrics.