Skip to content

Commit d615216

Browse files
Allow omitting the activation function between hidden layers; allow direct passing of torch modules
1 parent 63894ba commit d615216

File tree

2 files changed

+39
-21
lines changed

2 files changed

+39
-21
lines changed

mala/common/parameters.py

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -350,10 +350,13 @@ class ParametersNetwork(ParametersBase):
350350
activation function is used for all layers (including the output layer,
351351
i.e., an output activation is used!). Otherwise, the activation
352352
functions are added layer by layer.
353+
Note that no activation function is applied between input layer and
354+
first hidden layer!
353355
Currently supported activation functions are:
354356
355357
- Sigmoid
356358
- ReLU
359+
- None (no activation used)
357360
- LeakyReLU (default)
358361
359362
loss_function_type : string

mala/network/network.py

Lines changed: 36 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -231,17 +231,18 @@ def __init__(self, params):
231231
# We should NOT modify the list itself. This would break the
232232
# hyperparameter algorithms.
233233
use_only_one_activation_type = False
234-
if type(self.params.layer_activations) == str:
235-
use_only_one_activation_type = True
236-
elif len(self.params.layer_activations) > self.number_of_layers:
237-
printout(
238-
"Too many activation layers provided. The last",
239-
str(
240-
len(self.params.layer_activations) - self.number_of_layers
241-
),
242-
"activation function(s) will be ignored.",
243-
min_verbosity=1,
244-
)
234+
235+
if not isinstance(self.params.layer_activations, str):
236+
if len(self.params.layer_activations) > self.number_of_layers:
237+
printout(
238+
"Too many activation layers provided. The last",
239+
str(
240+
len(self.params.layer_activations)
241+
- self.number_of_layers
242+
),
243+
"activation function(s) will be ignored.",
244+
min_verbosity=1,
245+
)
245246

246247
# Add the layers.
247248
# As this is a feedforward NN we always add linear layers, and then
@@ -256,22 +257,18 @@ def __init__(self, params):
256257
)
257258
)
258259
try:
259-
if use_only_one_activation_type:
260-
self.layers.append(
261-
self._activation_mappings[
262-
self.params.layer_activations
263-
]()
260+
if isinstance(self.params.layer_activations, str):
261+
self._append_activation_function(
262+
self.params.layer_activations
264263
)
265264
else:
266-
self.layers.append(
267-
self._activation_mappings[
268-
self.params.layer_activations[i]
269-
]()
265+
self._append_activation_function(
266+
self.params.layer_activations[i]
270267
)
271268
except KeyError:
272269
raise Exception("Invalid activation type selected.")
273270
except IndexError:
274-
# Layer without activation
271+
# No activation functions left to append at the end.
275272
pass
276273

277274
# Once everything is done, we can move the Network on the target
@@ -297,6 +294,24 @@ def forward(self, inputs):
297294
inputs = layer(inputs)
298295
return inputs
299296

297+
def _append_activation_function(self, activation_function):
298+
"""
299+
Append an activation function to the network.
300+
301+
Parameters
302+
----------
303+
activation_function : str
304+
Activation function to be appended.
305+
"""
306+
if activation_function is None:
307+
pass
308+
elif isinstance(activation_function, str):
309+
self.layers.append(
310+
self._activation_mappings[activation_function]()
311+
)
312+
elif isinstance(activation_function, nn.Module):
313+
self.layers.append(activation_function)
314+
300315

301316
class LSTM(Network):
302317
"""Initialize this network as a LSTM network."""

0 commit comments

Comments
 (0)