Simulai pytorch templates

Neural Network Templates#

NetworkTemplate#

Bases: Module

Source code in simulai/templates/_pytorch_network.py

class NetworkTemplate(torch.nn.Module):
    def __init__(self, name: str = None, devices: str = None) -> None:
        """Template for a generic neural network

        Args:
            name (str): Name for the neural network model.
            devices (str): Kind of device in which the model will run, 
                'cpu' or 'gpu'.

        """
        super(NetworkTemplate, self).__init__()

        # Default choice for the model name
        if name == None:
            name = "nnet"

        self.name = name
        self.engine = torch.nn
        self.suplementary_engines = [torch, simulact]

        self.default_last_activation = None

        self.input_size = None
        self.output_size = None
        self.layers = None
        self.activations = None
        self.initializations = None

        self.shapes_dict = None
        self.device_type = devices
        self.device = self._set_device(devices=devices)

        if self.device_type != "cpu":
            self.to_wrap = self._to_explicit_device
        else:
            self.to_wrap = self._to_bypass

    @property
    def weights_l2(self) -> torch.Tensor:
        """It evaluates the global L^2 norm of all the model coefficients. 
        Returns:
            torch.Tensor: A tensor containing the value of this norm.

        """
        return sum([torch.norm(weight, p=2) for weight in self.weights])

    @property
    def weights_l1(self) -> torch.Tensor:
        """It evaluates the global L^1 norm of all the model coefficients. 
        Returns:
            torch.Tensor: A tensor containing the value of this norm.

        """

        return sum([torch.norm(weight, p=1) for weight in self.weights])

    @property
    def n_parameters(self) -> int:
        """It evaluates the total number of parameters for the model.eval 
        Returns:
            int: The total number of parameters for the model.
        """
        try:
            return int(
                sum([np.prod(tuple(param.shape)) for param in self.parameters()])
            )

        except Exception:
            print(f"Class {self} has no torch.nn.Parameter or attribute self.weights.")

    def _set_device(self, devices: Union[str, list] = "cpu") -> str:
        device = None
        if type(devices) == list():
            raise Exception("In construction.")
        elif type(str):
            if devices == "gpu":
                if torch.cuda.is_available():
                    try:
                        device = "cuda:" + os.environ["LOCAL_RANK"]
                    except KeyError:
                        device = "cuda"
                else:
                    device = "cpu"
            else:
                device = "cpu"

        return device

    def _get_from_guest(self, **kwargs) -> None:
        search_dict = copy.copy(self.__dict__)
        search_dict.update(kwargs)

        for key, value in search_dict.items():
            if hasattr(value, "share_to_host"):
                share_to_host = value.share_to_host

                for k, v in share_to_host.items():
                    print(f"Sharing the key {k} to host with value {v}")
                    setattr(self, k, v)

    # Getting up activation if it exists
    def _get_operation(
        self, operation: str = None, is_activation: bool = True, **kwargs, 
    ) -> callable:
        mod_items = dir(self.engine)
        mod_items_lower = [item.lower() for item in mod_items]

        if operation in mod_items_lower:
            operation_name = mod_items[mod_items_lower.index(operation)]
            operation_class = getattr(self.engine, operation_name)

            if is_activation is True:
                return operation_class(**kwargs)
            else:
                return operation_class
        else:
            try:
                for engine in self.suplementary_engines:
                    res_ = getattr(engine, operation, None)

                    if hasattr(res_, "__mro__"):
                        if torch.nn.Module in res_.__mro__:
                            res = res_
                            print(f"Module {operation} found in {engine}.")
                            return res(**kwargs)
                        else:
                            print(f"Module {operation} not found in {engine}.")
                    else:
                        print(f"Module {operation} not found in {engine}.")

            except AssertionError:
                raise Exception(
                    f"There is no correspondent to {operation} in {self.engine}"
                )

    def _setup_activations(
        self, activation: Union[str, list] = None, n_layers: int = None
    ) -> (list, Union[str, list]):
        if n_layers == None:
            assert self.n_layers, "n_layers is not defined."
            n_layers = self.n_layers

        # It instantiates an operation x^l = \sigma(y^l), in which y^l
        # is the output of the previous linear operation.
        if isinstance(activation, str):
            # Testing to instantiate an example of activation function.
            activation_op = self._get_operation(operation=activation)

            if isinstance(activation_op, simulact.TrainableActivation):

                activations_list = [self._get_operation(operation=activation,
                                                        is_activation=True, device=self.device)
                                    for i in range(n_layers - 1)]

            else:
                activations_list = [self._get_operation(operation=activation)
                                    for i in range(n_layers - 1)]

            return (
                activations_list
                + [self._get_operation(operation=self.default_last_activation)],
                (n_layers - 1) * [activation] + [self.default_last_activation],
            )

        elif isinstance(activation, list) and all(
            [isinstance(el, str) for el in activation]
        ):
            activations_list = list()
            for activation_name in activation:
                activation_op = self._get_operation(
                    operation=activation_name, is_activation=True
                )

                activations_list.append(activation_op)

            return activations_list, activation

        elif isinstance(activation, torch.nn.Module):
            return (
                (n_layers - 1) * [activation]
                + [self._get_operation(operation=self.default_last_activation)],
                (n_layers - 1) * [activation.name] + [self.default_last_activation],
            )

        elif isinstance(activation, list) and all(
            [isinstance(el, torch.nn.Module) for el in activation]
        ):
            activations_list = list()
            for activation_name in activation:
                activation_op = self._get_operation(
                    operation=activation_name, is_activation=True
                )

                activation_op.setup(device=self.device_type)

                activations_list.append(activation_op)

            return activations_list, activation

        else:
            raise Exception(
                "The activation format,"
                f"{type(activation)} is not supported."
            )

    # Instantiating all the linear layers.
    def _setup_hidden_layers(self, last_bias: bool = True) -> List[torch.nn.Module]:
        layers = list()
        input_layer = self._setup_layer(
            self.input_size,
            self.layers_units[0],
            initialization=self.initializations[0],
            first_layer=True,
        )

        layers.append(input_layer)
        self.add_module(self.name + "_" + "input", input_layer)
        self.weights.append(input_layer.weight)

        for li, layer_units in enumerate(self.layers_units[:-1]):
            layer_op = self._setup_layer(
                layer_units,
                self.layers_units[li + 1],
                initialization=self.initializations[li + 1],
            )

            layers.append(layer_op)
            self.add_module(self.name + "_" + str(li), layer_op)
            self.weights.append(layer_op.weight)

        output_layer = self._setup_layer(
            self.layers_units[-1],
            self.output_size,
            initialization=self.initializations[-1],
            bias=last_bias,
        )

        layers.append(output_layer)
        self.add_module(self.name + "_" + str(li + 1), output_layer)
        self.weights.append(output_layer.weight)

        return layers

    # It converts torch.tensor to np.ndarray. It is used for applications
    # employing SciPy optimizers.
    def _numpy_layers(self) -> List[np.ndarray]:
        numpy_layers = [
            [layer.weight.detach().numpy(), layer.bias.detach().numpy()]
            for layer in self.layers
        ]

        return numpy_layers

    # It converts torch.tensor to np.ndarray. It is used for applications
    # employing SciPy optimizers in which gradients are required.
    def _numpy_grad_layers(self) -> List[np.ndarray]:
        numpy_layers = [
            [
                layer.weight.grad.detach().numpy(),
                layer.bias.grad.detach().numpy()[None, :],
            ]
            for layer in self.layers
        ]

        return numpy_layers

    # It stores all the model parameters into a single flatten array, a
    # requirement from the SciPy optimizers.
    def _make_stitch_idx(self) -> np.ndarray:
        stitch_indices = list()
        partitions = list()
        self.n_tensors = len(self.shapes)

        all_dof = 0
        for ii, shape in enumerate(self.shapes):
            n_dof = np.prod(shape)
            idx = np.reshape(np.arange(all_dof, all_dof + n_dof, dtype=np.int32), shape)
            stitch_indices.append(idx)
            all_dof += n_dof
            partitions += [ii] * n_dof

        return stitch_indices

    def _to_explicit_device(
        self, entity: Union[torch.nn.Module, torch.Tensor], device: str = None
    ) -> Union[torch.nn.Module, torch.Tensor]:
        return entity.to(device)

    def _to_bypass(
        self, entity: Union[torch.nn.Module, torch.Tensor], device: str = None
    ) -> Union[torch.nn.Module, torch.Tensor]:
        return entity

    # It returns all the model parameters in a single array.
    def get_parameters(self) -> np.ndarray:
        """Returns all the model coefficients stacked into a single array.

        Returns:
            np.ndarray: A single-column array containing all the model parameters.

        """

        layers = self._numpy_layers()

        return np.hstack([item.flatten() for item in sum(layers, [])])

    # It returns all the gradients of the model parameters in a single array.
    def get_gradients(self) -> np.ndarray:
        """Returns all the model gradients (w.r.t the loss function) stacked into a single array.

        Returns:
            np.ndarray: A single-column array containing all the model gradients for the parameters.

        """

        grads = self._numpy_grad_layers()

        return np.hstack([item.flatten() for item in sum(grads, [])])

    def _set_parameter_from_array(self, data):
        return torch.from_numpy(data.astype(ARRAY_DTYPE))

    def _set_parameter_from_tensor(self, data):
        return data

    # Setting up values for the model parameters.
    def set_parameters(self, parameters:Union[torch.Tensor, np.ndarray]=None, requires_grad=True) -> None:
        """It overwrite the current parameters values with new ones.

        Args:
            parameters (List[torch.Tensor]): List of new values to overwrite the
                current parameters. 

        """

        # Determining the kind of data structure to be converted from
        struct_converter = { 
                            np.ndarray : self._set_parameter_from_array,
                            torch.Tensor : self._set_parameter_from_tensor
                           }.get(type(parameters))

        for ll, layer in enumerate(self.layers_map):

            self.layers[ll].weight = Parameter(
                data=struct_converter(
                    parameters[self.stitch_idx[layer[0]].flatten()].reshape(self.shapes_layers[ll][0])
                ),
                requires_grad=requires_grad,
            )

            self.layers[ll].bias = Parameter(
                data=struct_converter(
                    parameters[self.stitch_idx[layer[1]].flatten()].reshape(self.shapes_layers[ll][1])
                ),
                requires_grad=requires_grad,
            )

    # Detaching parameters from the backpropagation pipeline
    def detach_parameters(self) -> None:
        """Remove the parameters for the PyTorch graph,
            it means that they will not be trainable. 
        """
        for param in self.parameters():
            param.requires_grad = False
            param.data.copy_(param.data.detach())

    # Making evaluations using the network
    def eval(self, input_data: Union[np.ndarray, torch.Tensor] = None) -> np.ndarray:
        """It used the model to perform evaluations.

        Args:
            input_data (Union[np.ndarray, torch.Tensor]): The input data used for the 
                model evaluation.

        Returns:
            np.ndarray: The result of that evaluation. 

        """
        output_tensor = self.forward(input_data=input_data)

        # Guaranteeing the dataset location as CPU
        output_tensor = output_tensor.to("cpu")

        return output_tensor.detach().numpy()

    # It prints a summary of the network architecture.
    def summary(self, display: bool = True, **kwargs) -> None:
        """It prints a basic summary of the model architecure.

        Args:
            display (bool): Display that summary or not.

        """
        import pprint

        if display:
            pprinter = pprint.PrettyPrinter(indent=2)

            print("Summary of the network properties:")

            print("Linear operations layers:\n")
            pprinter.pprint(self.layers)
            print("\n")
            print("Activations layers:\n")
            pprinter.pprint(self.activations_str)
            print("\n")
            print("Initializations at each layer:\n")
            pprinter.pprint(self.initializations)
        else:
            pass

        self.shapes_dict = {"layers": self.layers}

    def save(self, save_dir: str = None, name: str = None, device: str = None) -> None:
        # Moving all the tensors to the destiny device if necessary
        if device is not None:
            print(f"Trying to move all the tensors to the destiny device {device}.")
            for key, value in self.state_dict().items():
                self.state_dict()[key] = value.to(device)
            print("Moving concluded.")
        else:
            pass

        try:
            torch.save(self.state_dict(), os.path.join(save_dir, name + ".pth"))
        except Exception:
            print(f"It was not possible to save {self}")

    def load(self, save_dir: str = None, name: str = None, device: str = None) -> None:
        print(f"Trying to load for {device}")

        try:
            if device != None:
                self.load_state_dict(
                    torch.load(
                        os.path.join(save_dir, name + ".pth"),
                        map_location=torch.device(device),
                    )
                )
            else:
                self.load_state_dict(torch.load(os.path.join(save_dir, name + ".pth")))
        except Exception:
            print(
                f"It was not possible to load from {os.path.join(save_dir, name + '.pth')}"
            )

`n_parameters: int` `property` #

It evaluates the total number of parameters for the model.eval Returns: int: The total number of parameters for the model.

`weights_l1: torch.Tensor` `property` #

It evaluates the global L^1 norm of all the model coefficients. Returns: torch.Tensor: A tensor containing the value of this norm.

`weights_l2: torch.Tensor` `property` #

It evaluates the global L^2 norm of all the model coefficients. Returns: torch.Tensor: A tensor containing the value of this norm.

`init(name=None, devices=None)` #

Template for a generic neural network

Parameters:

Name	Type	Description	Default
`name`	`str`	Name for the neural network model.	`None`
`devices`	`str`	Kind of device in which the model will run, 'cpu' or 'gpu'.	`None`

Source code in simulai/templates/_pytorch_network.py

def __init__(self, name: str = None, devices: str = None) -> None:
    """Template for a generic neural network

    Args:
        name (str): Name for the neural network model.
        devices (str): Kind of device in which the model will run, 
            'cpu' or 'gpu'.

    """
    super(NetworkTemplate, self).__init__()

    # Default choice for the model name
    if name == None:
        name = "nnet"

    self.name = name
    self.engine = torch.nn
    self.suplementary_engines = [torch, simulact]

    self.default_last_activation = None

    self.input_size = None
    self.output_size = None
    self.layers = None
    self.activations = None
    self.initializations = None

    self.shapes_dict = None
    self.device_type = devices
    self.device = self._set_device(devices=devices)

    if self.device_type != "cpu":
        self.to_wrap = self._to_explicit_device
    else:
        self.to_wrap = self._to_bypass

`detach_parameters()` #

Remove the parameters for the PyTorch graph, it means that they will not be trainable.

Source code in simulai/templates/_pytorch_network.py

def detach_parameters(self) -> None:
    """Remove the parameters for the PyTorch graph,
        it means that they will not be trainable. 
    """
    for param in self.parameters():
        param.requires_grad = False
        param.data.copy_(param.data.detach())

`eval(input_data=None)` #

It used the model to perform evaluations.

Parameters:

Name	Type	Description	Default
`input_data`	`Union[ndarray, Tensor]`	The input data used for the model evaluation.	`None`

Returns:

Type	Description
`ndarray`	np.ndarray: The result of that evaluation.

Source code in simulai/templates/_pytorch_network.py

def eval(self, input_data: Union[np.ndarray, torch.Tensor] = None) -> np.ndarray:
    """It used the model to perform evaluations.

    Args:
        input_data (Union[np.ndarray, torch.Tensor]): The input data used for the 
            model evaluation.

    Returns:
        np.ndarray: The result of that evaluation. 

    """
    output_tensor = self.forward(input_data=input_data)

    # Guaranteeing the dataset location as CPU
    output_tensor = output_tensor.to("cpu")

    return output_tensor.detach().numpy()

`get_gradients()` #

Returns all the model gradients (w.r.t the loss function) stacked into a single array.

Returns:

Type	Description
`ndarray`	np.ndarray: A single-column array containing all the model gradients for the parameters.

Source code in simulai/templates/_pytorch_network.py

def get_gradients(self) -> np.ndarray:
    """Returns all the model gradients (w.r.t the loss function) stacked into a single array.

    Returns:
        np.ndarray: A single-column array containing all the model gradients for the parameters.

    """

    grads = self._numpy_grad_layers()

    return np.hstack([item.flatten() for item in sum(grads, [])])

`get_parameters()` #

Returns all the model coefficients stacked into a single array.

Returns:

Type	Description
`ndarray`	np.ndarray: A single-column array containing all the model parameters.

Source code in simulai/templates/_pytorch_network.py

def get_parameters(self) -> np.ndarray:
    """Returns all the model coefficients stacked into a single array.

    Returns:
        np.ndarray: A single-column array containing all the model parameters.

    """

    layers = self._numpy_layers()

    return np.hstack([item.flatten() for item in sum(layers, [])])

`set_parameters(parameters=None, requires_grad=True)` #

It overwrite the current parameters values with new ones.

Parameters:

Name	Type	Description	Default
`parameters`	`List[Tensor]`	List of new values to overwrite the current parameters.	`None`

Source code in simulai/templates/_pytorch_network.py

def set_parameters(self, parameters:Union[torch.Tensor, np.ndarray]=None, requires_grad=True) -> None:
    """It overwrite the current parameters values with new ones.

    Args:
        parameters (List[torch.Tensor]): List of new values to overwrite the
            current parameters. 

    """

    # Determining the kind of data structure to be converted from
    struct_converter = { 
                        np.ndarray : self._set_parameter_from_array,
                        torch.Tensor : self._set_parameter_from_tensor
                       }.get(type(parameters))

    for ll, layer in enumerate(self.layers_map):

        self.layers[ll].weight = Parameter(
            data=struct_converter(
                parameters[self.stitch_idx[layer[0]].flatten()].reshape(self.shapes_layers[ll][0])
            ),
            requires_grad=requires_grad,
        )

        self.layers[ll].bias = Parameter(
            data=struct_converter(
                parameters[self.stitch_idx[layer[1]].flatten()].reshape(self.shapes_layers[ll][1])
            ),
            requires_grad=requires_grad,
        )

`summary(display=True, **kwargs)` #

It prints a basic summary of the model architecure.

Parameters:

Name	Type	Description	Default
`display`	`bool`	Display that summary or not.	`True`

Source code in simulai/templates/_pytorch_network.py

def summary(self, display: bool = True, **kwargs) -> None:
    """It prints a basic summary of the model architecure.

    Args:
        display (bool): Display that summary or not.

    """
    import pprint

    if display:
        pprinter = pprint.PrettyPrinter(indent=2)

        print("Summary of the network properties:")

        print("Linear operations layers:\n")
        pprinter.pprint(self.layers)
        print("\n")
        print("Activations layers:\n")
        pprinter.pprint(self.activations_str)
        print("\n")
        print("Initializations at each layer:\n")
        pprinter.pprint(self.initializations)
    else:
        pass

    self.shapes_dict = {"layers": self.layers}

ConvNetworkTemplate#

Bases: NetworkTemplate

Source code in simulai/templates/_pytorch_network.py

class ConvNetworkTemplate(NetworkTemplate):
    def __init__(self, name: str = None, flatten: bool = None) -> None:
        """A basic template for convolutional neural networks.

        Args:
            name (str): A name for the neural network model. 
            flatten (bool): Flatten the output or not. 

        """
        super(ConvNetworkTemplate, self).__init__()

        self.name = name
        self.flatten = flatten

        if flatten == True:
            self.flattener = self._flatten
        else:
            self.flattener = self._no_flatten

        # When no name is provided, it will employ a random number
        # as model name
        if self.name == None:
            self.name = id(self)

        self.args = []

        # The operation coming before or in the sequence of each convolution layer can be
        # a pooling ou a sampling
        self.before_conv_tag = ""
        self.after_conv_tag = ""
        self.batch_norm_tag = ""

        self.samples_dim = None

        self.case = None

        self.interpolation_prefix = {"1d": "", "2d": "bi", "3d": "tri"}

        self.output_shape = None

        self.shapes_dict = None

    def _no_flatten(self, input_data: torch.Tensor = None) -> torch.Tensor:
        return input_data

    def _flatten(self, input_data: torch.Tensor = None) -> torch.Tensor:
        n_samples, n_channels = input_data.shape[:2]
        collapsible_dimensions = np.prod(input_data.shape[2:])

        return torch.reshape(
            input_data, (n_samples, n_channels * collapsible_dimensions)
        )

    def _setup_layers(self, layers_config: dict = None) -> (list, list, list):
        before_conv_layers = list()
        conv_layers = list()
        after_conv_layers = list()
        batch_norm_layers = list()

        weights = list()

        # Configuring each layer
        for ll, layer_config in enumerate(layers_config):
            assert isinstance(layer_config, dict), (
                "Each entry of the layers list must be a dictionary,"
                f" but received {type(layer_config)}."
            )

            assert all(
                [i in layer_config for i in self.args]
            ), f"The arguments {self.args} must be defined."

            # If a post-conv operation is defined, instantiate it
            if self.before_conv_tag in layer_config:
                assert type(layer_config[self.before_conv_tag]) == dict, (
                    f"If the argument {self.before_conv_tag}"
                    f" is present, it must be dict,"
                    f" but received {type(self.before_conv_tag)}"
                )

                before_conv_layer_config = layer_config.pop(self.before_conv_tag)

                type_ = before_conv_layer_config.pop("type")
                after_conv_layer_ll_template = self._get_operation(
                    operation=type_, is_activation=False
                )

                before_conv_layer_ll = after_conv_layer_ll_template(
                    **before_conv_layer_config
                )

            # By contrast, it must be an identity operation
            else:
                before_conv_layer_ll = torch.nn.Identity()

            # If a post-conv operation is defined, instantiate it
            if self.after_conv_tag in layer_config:
                assert type(layer_config[self.after_conv_tag]) == dict, (
                    f"If the argument {self.after_conv_tag}"
                    f" is present, it must be dict,"
                    f" but received {type(self.after_conv_tag)}"
                )

                after_conv_layer_config = layer_config.pop(self.after_conv_tag)

                type_ = after_conv_layer_config.pop("type")
                after_conv_layer_ll_template = self._get_operation(
                    operation=type_, is_activation=False
                )

                after_conv_layer_ll = after_conv_layer_ll_template(
                    **after_conv_layer_config
                )

            # By contrast, it must be an identity operation
            else:
                after_conv_layer_ll = torch.nn.Identity()

            # If a post-conv operation is defined, instantiate it
            if self.batch_norm_tag in layer_config:
                assert type(layer_config[self.batch_norm_tag]) == dict, (
                    f"If the argument {self.batch_norm_tag}"
                    f" is present, it must be dict,"
                    f" but received {type(self.batch_norm_tag)}"
                )

                batch_norm_layer_config = layer_config.pop(self.batch_norm_tag)

                type_ = batch_norm_layer_config.pop("type")
                batch_norm_layer_ll_template = self._get_operation(
                    operation=type_, is_activation=False
                )

                batch_norm_layer_ll = batch_norm_layer_ll_template(
                    **batch_norm_layer_config
                )

            # By contrast, it must be an identity operation
            else:
                batch_norm_layer_ll = torch.nn.Identity()

            args = [layer_config.pop(arg) for arg in self.args]

            # The convolution layer itself
            conv_layer_ll = self.layer_template(*args, **layer_config)

            before_conv_layers.append(before_conv_layer_ll)
            conv_layers.append(conv_layer_ll)
            after_conv_layers.append(after_conv_layer_ll)
            batch_norm_layers.append(batch_norm_layer_ll)

            # Setting up the individual modules to the global one
            self.add_module(self.name + "_before_conv_" + str(ll), before_conv_layer_ll)
            self.add_module(self.name + "_" + str(ll), conv_layer_ll)
            self.add_module(self.name + "_after_conv_" + str(ll), after_conv_layer_ll)
            self.add_module(self.name + "_batch_norm_" + str(ll), batch_norm_layer_ll)

            weights.append(conv_layer_ll.weight)

            # Batch normalization also has trainable paramters
            if not isinstance(batch_norm_layer_ll, torch.nn.Identity):
                weights.append(batch_norm_layer_ll.weight)

        return (
            before_conv_layers,
            conv_layers,
            after_conv_layers,
            batch_norm_layers,
            weights,
        )

    def _correct_first_dim(self, shapes: list = None) -> list:
        shapes[0] = None

        return shapes

    # Merging the layers into a reasonable sequence
    def _merge(
        self,
        before_conv: list = None,
        conv: list = None,
        act: list = None,
        after_conv: list = None,
        batch_norm: list = None,
    ) -> list:
        merged_list = list()

        for h, i, j, k, l in zip(before_conv, conv, act, batch_norm, after_conv):
            merged_list.append(h)
            merged_list.append(i)
            merged_list.append(j)
            merged_list.append(k)
            merged_list.append(l)

        return merged_list

    # It prints an overview of the network architecture
    def summary(
        self,
        input_data: Union[torch.Tensor, np.ndarray] = None,
        input_shape: list = None,
        device: str = "cpu",
        display: bool = True,
    ) -> None:
        """

        Args:
            input_data (Union[torch.Tensor, np.ndarray]): An input data used for 
                helping to construct the model summary.
            input_shape (list): When input_data is not provided, a shape for it
                can be used instead.
            device (str): The kind of device in which the model will be executed,
                'cpu' or 'gpu'.
            display (bool): Display this summary or not.

        """
        import pprint
        from collections import OrderedDict

        # When no input data is provided, a list containing the shape is used for creating an
        # overview of the network architecture
        if type(input_data) == type(None):
            assert type(input_shape) == list, (
                "If no input data is provided, it is necessary" " to have input_shape."
            )

            input_shape[0] = 1

            input_data = torch.ones(*input_shape).to(device)

        else:
            pass

        if isinstance(input_data, np.ndarray):
            input_data = torch.from_numpy(input_data.astype(ARRAY_DTYPE)).to(device)

        else:
            pass

        input_tensor_ = input_data
        shapes_dict = OrderedDict()

        for layer_id in range(len(self.conv_layers)):
            # Applying operations before convolution
            output_tensor_before_conv = self.before_conv_layers[layer_id](input_tensor_)

            if hasattr(self.after_conv_layers[layer_id], "_get_name"):
                input_shape = self._correct_first_dim(list(input_tensor_.shape))
                output_shape = self._correct_first_dim(
                    list(output_tensor_before_conv.shape)
                )

                shapes_dict[
                    f"{self.before_conv_layers[layer_id]._get_name()}_{layer_id}"
                ] = {"Input shape": input_shape, "Output shape": output_shape}

            # Applying  convolution operations
            output_tensor_conv = self.conv_layers[layer_id](output_tensor_before_conv)

            input_shape = self._correct_first_dim(list(output_tensor_before_conv.shape))
            output_shape = self._correct_first_dim(list(output_tensor_conv.shape))

            shapes_dict[f"{self.conv_layers[layer_id]._get_name()}_{layer_id}"] = {
                "Input shape": input_shape,
                "Output shape": output_shape,
            }

            shapes_dict[f"Activation_{layer_id}"] = self.activations[layer_id]

            output_tensor_after_conv = self.after_conv_layers[layer_id](
                output_tensor_conv
            )

            # Applying operations before convolution
            if hasattr(self.after_conv_layers[layer_id], "_get_name"):
                input_shape = self._correct_first_dim(list(output_tensor_conv.shape))
                output_shape = self._correct_first_dim(
                    list(output_tensor_after_conv.shape)
                )

                shapes_dict[
                    f"{self.after_conv_layers[layer_id]._get_name()}_{layer_id}"
                ] = {"Input shape": input_shape, "Output shape": output_shape}

            input_tensor_ = output_tensor_after_conv

        if display == True:
            pprint.pprint(shapes_dict, indent=2)

        self.shapes_dict = shapes_dict

        output_size = list(shapes_dict.values())[-1]["Output shape"]
        self.input_size = list(shapes_dict.values())[0]["Input shape"]

        # When the network output is reshaped, it is necessary to correct the value of self.output_size
        if self.flatten == True:
            self.output_shape = tuple(output_size)
            self.output_size = int(np.prod(output_size[1:]))
        else:
            self.output_shape = tuple(output_size)
            self.output_size = output_size

`init(name=None, flatten=None)` #

A basic template for convolutional neural networks.

Parameters:

Name	Type	Description	Default
`name`	`str`	A name for the neural network model.	`None`
`flatten`	`bool`	Flatten the output or not.	`None`

Source code in simulai/templates/_pytorch_network.py

def __init__(self, name: str = None, flatten: bool = None) -> None:
    """A basic template for convolutional neural networks.

    Args:
        name (str): A name for the neural network model. 
        flatten (bool): Flatten the output or not. 

    """
    super(ConvNetworkTemplate, self).__init__()

    self.name = name
    self.flatten = flatten

    if flatten == True:
        self.flattener = self._flatten
    else:
        self.flattener = self._no_flatten

    # When no name is provided, it will employ a random number
    # as model name
    if self.name == None:
        self.name = id(self)

    self.args = []

    # The operation coming before or in the sequence of each convolution layer can be
    # a pooling ou a sampling
    self.before_conv_tag = ""
    self.after_conv_tag = ""
    self.batch_norm_tag = ""

    self.samples_dim = None

    self.case = None

    self.interpolation_prefix = {"1d": "", "2d": "bi", "3d": "tri"}

    self.output_shape = None

    self.shapes_dict = None

`summary(input_data=None, input_shape=None, device='cpu', display=True)` #

Parameters:

Name	Type	Description	Default
`input_data`	`Union[Tensor, ndarray]`	An input data used for helping to construct the model summary.	`None`
`input_shape`	`list`	When input_data is not provided, a shape for it can be used instead.	`None`
`device`	`str`	The kind of device in which the model will be executed, 'cpu' or 'gpu'.	`'cpu'`
`display`	`bool`	Display this summary or not.	`True`

Source code in simulai/templates/_pytorch_network.py

def summary(
    self,
    input_data: Union[torch.Tensor, np.ndarray] = None,
    input_shape: list = None,
    device: str = "cpu",
    display: bool = True,
) -> None:
    """

    Args:
        input_data (Union[torch.Tensor, np.ndarray]): An input data used for 
            helping to construct the model summary.
        input_shape (list): When input_data is not provided, a shape for it
            can be used instead.
        device (str): The kind of device in which the model will be executed,
            'cpu' or 'gpu'.
        display (bool): Display this summary or not.

    """
    import pprint
    from collections import OrderedDict

    # When no input data is provided, a list containing the shape is used for creating an
    # overview of the network architecture
    if type(input_data) == type(None):
        assert type(input_shape) == list, (
            "If no input data is provided, it is necessary" " to have input_shape."
        )

        input_shape[0] = 1

        input_data = torch.ones(*input_shape).to(device)

    else:
        pass

    if isinstance(input_data, np.ndarray):
        input_data = torch.from_numpy(input_data.astype(ARRAY_DTYPE)).to(device)

    else:
        pass

    input_tensor_ = input_data
    shapes_dict = OrderedDict()

    for layer_id in range(len(self.conv_layers)):
        # Applying operations before convolution
        output_tensor_before_conv = self.before_conv_layers[layer_id](input_tensor_)

        if hasattr(self.after_conv_layers[layer_id], "_get_name"):
            input_shape = self._correct_first_dim(list(input_tensor_.shape))
            output_shape = self._correct_first_dim(
                list(output_tensor_before_conv.shape)
            )

            shapes_dict[
                f"{self.before_conv_layers[layer_id]._get_name()}_{layer_id}"
            ] = {"Input shape": input_shape, "Output shape": output_shape}

        # Applying  convolution operations
        output_tensor_conv = self.conv_layers[layer_id](output_tensor_before_conv)

        input_shape = self._correct_first_dim(list(output_tensor_before_conv.shape))
        output_shape = self._correct_first_dim(list(output_tensor_conv.shape))

        shapes_dict[f"{self.conv_layers[layer_id]._get_name()}_{layer_id}"] = {
            "Input shape": input_shape,
            "Output shape": output_shape,
        }

        shapes_dict[f"Activation_{layer_id}"] = self.activations[layer_id]

        output_tensor_after_conv = self.after_conv_layers[layer_id](
            output_tensor_conv
        )

        # Applying operations before convolution
        if hasattr(self.after_conv_layers[layer_id], "_get_name"):
            input_shape = self._correct_first_dim(list(output_tensor_conv.shape))
            output_shape = self._correct_first_dim(
                list(output_tensor_after_conv.shape)
            )

            shapes_dict[
                f"{self.after_conv_layers[layer_id]._get_name()}_{layer_id}"
            ] = {"Input shape": input_shape, "Output shape": output_shape}

        input_tensor_ = output_tensor_after_conv

    if display == True:
        pprint.pprint(shapes_dict, indent=2)

    self.shapes_dict = shapes_dict

    output_size = list(shapes_dict.values())[-1]["Output shape"]
    self.input_size = list(shapes_dict.values())[0]["Input shape"]

    # When the network output is reshaped, it is necessary to correct the value of self.output_size
    if self.flatten == True:
        self.output_shape = tuple(output_size)
        self.output_size = int(np.prod(output_size[1:]))
    else:
        self.output_shape = tuple(output_size)
        self.output_size = output_size

Neural Network Templates#

NetworkTemplate#

n_parameters: int property #

weights_l1: torch.Tensor property #

weights_l2: torch.Tensor property #

__init__(name=None, devices=None) #

detach_parameters() #

eval(input_data=None) #

get_gradients() #

get_parameters() #

set_parameters(parameters=None, requires_grad=True) #

summary(display=True, **kwargs) #

ConvNetworkTemplate#

__init__(name=None, flatten=None) #

summary(input_data=None, input_shape=None, device='cpu', display=True) #

`n_parameters: int` `property` #

`weights_l1: torch.Tensor` `property` #

`weights_l2: torch.Tensor` `property` #

`init(name=None, devices=None)` #

`detach_parameters()` #

`eval(input_data=None)` #

`get_gradients()` #

`get_parameters()` #

`set_parameters(parameters=None, requires_grad=True)` #

`summary(display=True, **kwargs)` #

`init(name=None, flatten=None)` #

`summary(input_data=None, input_shape=None, device='cpu', display=True)` #