
Commit 8b67528
Merge pull request #180 from IBM/fix/wavelet_activation
Fix/wavelet activation
Joao-L-S-Almeida authored Feb 6, 2024
2 parents cf0dc64 + 94bede5, commit 8b67528
Showing 2 changed files with 10 additions and 2 deletions.
simulai/models/_pytorch_models/_transformer.py (9 additions, 0 deletions)
@@ -178,6 +178,7 @@ def __init__(
         decoder_mlp_layer_config: dict = None,
         number_of_encoders: int = 1,
         number_of_decoders: int = 1,
+        devices: Union[str, list] = "cpu",
     ) -> None:
         r"""A classical encoder-decoder transformer:
@@ -229,6 +230,9 @@ def __init__(
         self.encoder_mlp_layers_list = list()
         self.decoder_mlp_layers_list = list()
 
+        # Determining the kind of device on which the model will be executed
+        self.device = self._set_device(devices=devices)
+
         # Creating independent copies for the MLP layers which will be used
         # by the multiple encoders/decoders.
         for e in range(self.number_of_encoders):
@@ -281,6 +285,11 @@ def __init__(
         self.final_layer = Linear(input_size=self.embed_dim_decoder, output_size=self.output_dim)
         self.add_module("final_linear_layer", self.final_layer)
 
+        # Sending everything to the proper device
+        self.EncoderStage = self.EncoderStage.to(self.device)
+        self.DecoderStage = self.DecoderStage.to(self.device)
+        self.final_layer = self.final_layer.to(self.device)
+
     @as_tensor
     def forward(
         self, input_data: Union[torch.Tensor, np.ndarray] = None
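For context on what this change does: the constructor now takes a `devices` argument, resolves it once through the `_set_device` helper, and moves every submodule to the resulting device. Below is a minimal standalone sketch of that pattern; the body of `set_device` is an assumption, since only the helper's call site appears in this diff.

    import torch

    # Hypothetical stand-in for the `_set_device` helper used above;
    # its real implementation lives elsewhere in simulai.
    def set_device(devices="cpu"):
        if isinstance(devices, list):  # assumption: use the first entry
            devices = devices[0]
        if devices == "gpu" and torch.cuda.is_available():
            return "cuda"
        return "cpu"

    # Resolve once, then move each submodule explicitly, mirroring the
    # `.to(self.device)` calls added at the end of __init__ above.
    device = set_device(devices="gpu")
    layer = torch.nn.Linear(16, 16).to(device)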
simulai/templates/_pytorch_network.py (1 addition, 2 deletions)
@@ -172,7 +172,7 @@ def _setup_activations(
             activation_op = self._get_operation(operation=activation)
 
             return (
-                (n_layers - 1) * [activation_op]
+                [self._get_operation(operation=activation) for i in range(n_layers - 1)]
                 + [self._get_operation(operation=self.default_last_activation)],
                 (n_layers - 1) * [activation] + [self.default_last_activation],
             )
@@ -212,7 +212,6 @@ def _setup_activations(
 
             return activations_list, activation
 
-
         else:
             raise Exception(
                 "The activation format,"
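The substantive fix is in `_setup_activations`: `(n_layers - 1) * [activation_op]` replicates a single activation object, so every layer shared one module instance, and for activations with trainable parameters (such as the wavelet activation this PR targets) all layers would read and update the same weights. The list comprehension instead instantiates a fresh activation per layer. A short illustration of the difference; `PReLU` stands in for the wavelet activation here, since any module with learnable parameters shows the same behavior.

    import torch

    act = torch.nn.PReLU()
    shared = 3 * [act]  # three references to ONE module object
    independent = [torch.nn.PReLU() for _ in range(3)]  # three distinct modules

    print(shared[0] is shared[1])            # True  -> one shared weight
    print(independent[0] is independent[1])  # False -> per-layer weights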
