Source code for torchrl.models.base_model

import os
from abc import ABC, abstractmethod

import torch

import torchrl.utils as U
from torchrl.nn import ModuleExtended


class BaseModel(ModuleExtended, ABC):
    """
    Basic TorchRL model, wrapping a pytorch module and the batcher
    used to feed it.

    Parameters
    ----------
    model: nn.Module
        A pytorch model.
    batcher: torchrl.batcher
        A torchrl batcher.
    cuda_default: bool
        If True and cuda is supported, use it (Default is True).
    """

    def __init__(self, model, batcher, *, cuda_default=True):
        super().__init__()
        self.model = model
        self.batcher = batcher

        self.memory = U.memories.DefaultMemory()
        self.losses = []
        self.register_losses()
        self.callbacks = U.Callback()
        self.register_callbacks()
        self.logger = None

        # Enable cuda if wanted and available
        self.cuda_enabled = cuda_default and torch.cuda.is_available()
        if self.cuda_enabled:
            self.model.cuda()

    @property
    @abstractmethod
    def batch_keys(self):
        """
        The batch keys needed for computing all losses.

        This is done to reduce overhead when sampling a dataloader;
        it makes sure only the requested keys are being sampled.
        """

    @abstractmethod
    def register_losses(self):
        """
        Append losses to ``self.losses``; the losses are used at
        :meth:`optimizer_step` for calculating the gradients.
        """
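    # Illustrative sketch (hypothetical, not part of the library): a concrete
    # subclass is expected to implement the abstract members roughly like
    # this, where ``ValueModel``, ``mse_loss`` and the batch keys are
    # invented names:
    #
    #     class ValueModel(BaseModel):
    #         @property
    #         def batch_keys(self):
    #             return ["state_t", "vtarget"]
    #
    #         def register_losses(self):
    #             self.register_loss(self.mse_loss)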
    @staticmethod
    @abstractmethod
    def output_layer(input_shape, action_info):
        """
        The final layer of the model, will be appended to the model head.

        Parameters
        ----------
        input_shape: int or tuple
            The shape of the input to this layer.
        action_info: dict
            Dictionary containing information about the action space.

        Examples
        --------
        The output of most PG models has the same dimension as the action,
        but the output of the Value models is rank 1. This is where that
        difference is defined.
        """
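    # Hypothetical sketch of how a subclass could satisfy ``output_layer``
    # for a scalar state-value head (the layer choice is illustrative and
    # assumes a flat integer ``input_shape``):
    #
    #     @staticmethod
    #     def output_layer(input_shape, action_info):
    #         return torch.nn.Linear(input_shape, 1)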
    @property
    def body(self):
        return self.model.layers[0]

    @property
    def head(self):
        return self.model.layers[1]

    @property
    def name(self):
        return self.__class__.__name__

    def num_steps(self):
        return self.batcher.num_steps

    def register_loss(self, func):
        self.losses.append(func)

    def register_callbacks(self):
        self.callbacks.register_cleanup(self.write_logs)
        self.callbacks.register_cleanup(self.clear_memory)

    def clear_memory(self, batch):
        self.memory.clear()

    def calculate_loss(self, batch):
        losses = {f.__name__: f(batch) for f in self.losses}
        self.memory.losses.append(losses)

        return sum(losses.values())
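    # A registered loss is any callable that takes the batch dict and returns
    # a scalar tensor; ``calculate_loss`` sums all of them and records each
    # value under the function's ``__name__``. Hypothetical sketch:
    #
    #     def mse_loss(self, batch):
    #         pred = self.forward(batch["state_t"])
    #         return torch.nn.functional.mse_loss(pred, batch["vtarget"])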
    def forward(self, x):
        """
        Defines the computation performed at every call.

        Parameters
        ----------
        x: numpy.ndarray
            The environment state.
        """
        return self.model(x)
    def attach_logger(self, logger):
        """
        Register a logger to this model.

        Parameters
        ----------
        logger: torchrl.utils.logger
        """
        self.logger = logger
    def wrap_name(self, name):
        return "/".join([self.name, name])

    def add_log(self, name, value, **kwargs):
        self.logger.add_log(name=self.wrap_name(name), value=value, **kwargs)

    def add_tf_only_log(self, name, value, **kwargs):
        self.logger.add_tf_only_log(name=self.wrap_name(name), value=value, **kwargs)

    def add_debug_log(self, name, value, **kwargs):
        self.logger.add_debug(name=self.wrap_name(name), value=value, **kwargs)

    def add_histogram_log(self, name, values, **kwargs):
        self.logger.add_histogram(name=self.wrap_name(name), values=values, **kwargs)
    def write_logs(self, batch):
        """
        Write logs to the terminal and to a tf log file.

        Parameters
        ----------
        batch: Batch
            Some logs might need the batch for calculation.
        """
        total_loss = 0
        # Average each loss over all updates accumulated since the last cleanup
        for k in self.memory.losses[0]:
            partial_loss = 0
            for loss in self.memory.losses:
                partial_loss += loss[k]
            partial_loss = partial_loss / len(self.memory.losses)

            total_loss += partial_loss
            self.add_tf_only_log("/".join(["Loss", k]), partial_loss, precision=4)

        self.add_log("Loss/Total", total_loss, precision=4)
    @classmethod
    def from_config(cls, config, batcher=None, body=None, head=None, **kwargs):
        """
        Creates a model from a configuration file.

        Parameters
        ----------
        config: Config
            Should contain at least a network definition (``nn_config`` section).
        batcher: torchrl.batcher
            A torchrl batcher (Default is None).
        body: Module
            Optional module to use as the network body (Default is None).
        head: Module
            Optional module to use as the network head (Default is None).
        kwargs: key-word arguments
            Extra arguments that will be passed to the class constructor.

        Returns
        -------
        torchrl.models
            A TorchRL model.
        """
        if "body" not in config.nn_config:
            config.nn_config.body = []
        if "head" not in config.nn_config:
            config.nn_config.head = []

        nn_config = config.pop("nn_config")
        model = U.nn_from_config(
            config=nn_config,
            state_info=batcher.get_state_info(),
            action_info=batcher.get_action_info(),
            body=body,
            head=head,
        )

        output_layer = cls.output_layer(
            input_shape=model.get_output_shape(batcher.get_state_info().shape),
            action_info=batcher.get_action_info(),
        )
        model.layers.head.append(output_layer)

        return cls(model=model, batcher=batcher, **config.as_dict(), **kwargs)
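    # Typical usage sketch (the file name and subclass are illustrative):
    #
    #     config = U.Config.load("value_model.yaml")
    #     model = ValueModel.from_config(config, batcher=batcher)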
    @classmethod
    def from_file(cls, file_path, *args, **kwargs):
        config = U.Config.load(file_path)

        return cls.from_config(config, *args, **kwargs)

    @classmethod
    def from_arch(cls, arch, *args, **kwargs):
        module_path = os.path.abspath(os.path.dirname(__file__))
        path = os.path.join(module_path, "archs", arch)

        return cls.from_file(file_path=path, *args, **kwargs)
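# ``from_arch`` resolves ``arch`` against the package's bundled ``archs``
# directory, e.g. (illustrative, assuming such a file ships with the package):
#
#     model = ValueModel.from_arch("a3c.yaml", batcher=batcher)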