From 96784b8f4314d9e3349c843fece0d13a35bf65cc Mon Sep 17 00:00:00 2001
From: letizia iannucci
Date: Tue, 7 May 2024 20:54:13 +0300
Subject: [PATCH 1/4] add torch train to vae

---
 tsgm/models/cvae.py | 126 +++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 112 insertions(+), 14 deletions(-)

diff --git a/tsgm/models/cvae.py b/tsgm/models/cvae.py
index 3080f6c..44c779f 100644
--- a/tsgm/models/cvae.py
+++ b/tsgm/models/cvae.py
@@ -1,5 +1,8 @@
 from tensorflow import keras
 import tensorflow as tf
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
 import typing as T
 
 import tsgm.utils
@@ -9,7 +12,10 @@ class BetaVAE(keras.Model):
     """
     beta-VAE implementation for unlabeled time series.
     """
-    def __init__(self, encoder: keras.Model, decoder: keras.Model, beta: float = 1.0, **kwargs) -> None:
+
+    def __init__(
+        self, encoder: keras.Model, decoder: keras.Model, beta: float = 1.0, **kwargs
+    ) -> None:
         """
         :param encoder: An encoder model which takes a time series as input and
             check whether the image is real or fake.
@@ -59,10 +65,14 @@ def call(self, X: tsgm.types.Tensor) -> tsgm.types.Tensor:
             x_decoded = x_decoded.reshape((1, -1))
         return x_decoded
 
-    def _get_reconstruction_loss(self, X: tsgm.types.Tensor, Xr: tsgm.types.Tensor) -> float:
-        reconst_loss = tsgm.utils.reconstruction_loss_by_axis(X, Xr, axis=0) +\
-            tsgm.utils.reconstruction_loss_by_axis(X, Xr, axis=1) +\
-            tsgm.utils.reconstruction_loss_by_axis(X, Xr, axis=2)
+    def _get_reconstruction_loss(
+        self, X: tsgm.types.Tensor, Xr: tsgm.types.Tensor
+    ) -> float:
+        reconst_loss = (
+            tsgm.utils.reconstruction_loss_by_axis(X, Xr, axis=0)
+            + tsgm.utils.reconstruction_loss_by_axis(X, Xr, axis=1)
+            + tsgm.utils.reconstruction_loss_by_axis(X, Xr, axis=2)
+        )
         return reconst_loss
 
     def train_step(self, data: tsgm.types.Tensor) -> T.Dict:
@@ -106,9 +116,44 @@ def generate(self, n: int) -> tsgm.types.Tensor:
         z = tf.random.normal((n, self.latent_dim))
         return self.decoder(z)
 
+    def train_step_torch(self, data: torch.Tensor) -> T.Dict:
+        """
+        Performs a training step using a batch of data, stored in data.
+
+        :param data: A batch of data in a format batch_size x seq_len x feat_dim
+        :type data: torch.Tensor
+
+        :returns: A dict with losses
+        :rtype: T.Dict
+        """
+        z_mean, z_log_var, z = self.encoder(data)
+        reconstruction = self.decoder(z)
+        reconstruction_loss = self._get_reconstruction_loss(data, reconstruction)
+        kl_loss = -0.5 * (1 + z_log_var - torch.square(z_mean) - torch.exp(z_log_var))
+        kl_loss = torch.mean(torch.sum(kl_loss, axis=1))
+        total_loss = reconstruction_loss + kl_loss
+
+        self.total_loss_tracker.update_state(total_loss)
+        self.reconstruction_loss_tracker.update_state(reconstruction_loss)
+        self.kl_loss_tracker.update_state(kl_loss)
+
+        return {
+            "loss": self.total_loss_tracker.result(),
+            "reconstruction_loss": self.reconstruction_loss_tracker.result(),
+            "kl_loss": self.kl_loss_tracker.result(),
+        }
+
 
 class cBetaVAE(keras.Model):
-    def __init__(self, encoder: keras.Model, decoder: keras.Model, latent_dim: int, temporal: bool, beta: float = 1.0, **kwargs) -> None:
+    def __init__(
+        self,
+        encoder: keras.Model,
+        decoder: keras.Model,
+        latent_dim: int,
+        temporal: bool,
+        beta: float = 1.0,
+        **kwargs
+    ) -> None:
         super(cBetaVAE, self).__init__(**kwargs)
         self.beta = beta
         self.encoder = encoder
@@ -134,7 +179,9 @@ def metrics(self) -> T.List:
             self.kl_loss_tracker,
         ]
 
-    def generate(self, labels: tsgm.types.Tensor) -> T.Tuple[tsgm.types.Tensor, tsgm.types.Tensor]:
+    def generate(
+        self, labels: tsgm.types.Tensor
+    ) -> T.Tuple[tsgm.types.Tensor, tsgm.types.Tensor]:
         """
         Generates new data from the model.
 
@@ -145,7 +192,9 @@ def generate(self, labels: tsgm.types.Tensor) -> T.Tuple[tsgm.types.Tensor, tsgm
         :rtype: T.Tuple[tsgm.types.Tensor, tsgm.types.Tensor]
         """
         batch_size = tf.shape(labels)[0]
-        z = tf.random.normal((batch_size, self._seq_len, self.latent_dim), dtype=labels.dtype)
+        z = tf.random.normal(
+            (batch_size, self._seq_len, self.latent_dim), dtype=labels.dtype
+        )
         decoder_input = self._get_decoder_input(z, labels)
         return (self.decoder(decoder_input), labels)
 
@@ -168,20 +217,36 @@ def call(self, data: tsgm.types.Tensor) -> tsgm.types.Tensor:
             x_decoded = x_decoded.reshape((1, -1))
         return x_decoded
 
-    def _get_reconstruction_loss(self, X: tsgm.types.Tensor, Xr: tsgm.types.Tensor) -> float:
-        reconst_loss = tf.reduce_sum(tf.math.squared_difference(X, Xr)) +\
-            tf.reduce_sum(tf.math.squared_difference(tf.reduce_mean(X, axis=1), tf.reduce_mean(Xr, axis=1))) +\
-            tf.reduce_sum(tf.math.squared_difference(tf.reduce_mean(X, axis=2), tf.reduce_mean(Xr, axis=2)))
+    def _get_reconstruction_loss(
+        self, X: tsgm.types.Tensor, Xr: tsgm.types.Tensor
+    ) -> float:
+        reconst_loss = (
+            tf.reduce_sum(tf.math.squared_difference(X, Xr))
+            + tf.reduce_sum(
+                tf.math.squared_difference(
+                    tf.reduce_mean(X, axis=1), tf.reduce_mean(Xr, axis=1)
+                )
+            )
+            + tf.reduce_sum(
+                tf.math.squared_difference(
+                    tf.reduce_mean(X, axis=2), tf.reduce_mean(Xr, axis=2)
+                )
+            )
+        )
         return reconst_loss
 
-    def _get_encoder_input(self, X: tsgm.types.Tensor, labels: tsgm.types.Tensor) -> tsgm.types.Tensor:
+    def _get_encoder_input(
+        self, X: tsgm.types.Tensor, labels: tsgm.types.Tensor
+    ) -> tsgm.types.Tensor:
         if self._temporal:
             return tf.concat([X, labels[:, :, None]], axis=2)
         else:
             rep_labels = tf.repeat(labels[:, None, :], [self._seq_len], axis=1)
             return tf.concat([X, rep_labels], axis=2)
 
-    def _get_decoder_input(self, z: tsgm.types.Tensor, labels: tsgm.types.Tensor) -> tsgm.types.Tensor:
+    def _get_decoder_input(
+        self, z: tsgm.types.Tensor, labels: tsgm.types.Tensor
+    ) -> tsgm.types.Tensor:
         if self._temporal:
             rep_labels = labels[:, :, None]
         else:
@@ -220,3 +285,36 @@ def train_step(self, data: tsgm.types.Tensor) -> T.Dict[str, float]:
             "reconstruction_loss": self.reconstruction_loss_tracker.result(),
             "kl_loss": self.kl_loss_tracker.result(),
         }
+
+    def train_step_torch(
+        self, data: T.Tuple[torch.Tensor, torch.Tensor]
+    ) -> T.Dict[str, float]:
+        """
+        Performs a training step using a batch of data, stored in data.
+
+        :param data: A batch of data in a format batch_size x seq_len x feat_dim
+        :type data: T.Tuple[torch.Tensor, torch.Tensor]
+
+        :returns: A dict with losses
+        :rtype: T.Dict[str, float]
+        """
+        X, labels = data
+        encoder_input = self._get_encoder_input(X, labels)
+        z_mean, z_log_var, z = self.encoder(encoder_input)
+
+        decoder_input = self._get_decoder_input(z_mean, labels)
+        reconstruction = self.decoder(decoder_input)
+        reconstruction_loss = self._get_reconstruction_loss(X, reconstruction)
+        kl_loss = -0.5 * (1 + z_log_var - torch.square(z_mean) - torch.exp(z_log_var))
+        kl_loss = torch.mean(torch.sum(kl_loss, axis=1))
+        total_loss = reconstruction_loss + self.beta * kl_loss
+
+        self.total_loss_tracker.update_state(total_loss)
+        self.reconstruction_loss_tracker.update_state(reconstruction_loss)
+        self.kl_loss_tracker.update_state(kl_loss)
+
+        return {
+            "loss": self.total_loss_tracker.result(),
+            "reconstruction_loss": self.reconstruction_loss_tracker.result(),
+            "kl_loss": self.kl_loss_tracker.result(),
+        }

From 551e3f83d36577792e07b806aa372d99762e5ff2 Mon Sep 17 00:00:00 2001
From: letizia iannucci
Date: Tue, 21 May 2024 17:45:50 +0300
Subject: [PATCH 2/4] remove unused imports

---
 tsgm/models/cvae.py | 2 --
 1 file changed, 2 deletions(-)

diff --git a/tsgm/models/cvae.py b/tsgm/models/cvae.py
index 44c779f..670b1e4 100644
--- a/tsgm/models/cvae.py
+++ b/tsgm/models/cvae.py
@@ -1,8 +1,6 @@
 from tensorflow import keras
 import tensorflow as tf
 import torch
-import torch.nn as nn
-import torch.nn.functional as F
 import typing as T
 
 import tsgm.utils

From f261b4e1229be7a82477e4276ab8b77163dcd5f2 Mon Sep 17 00:00:00 2001
From: letizia iannucci
Date: Tue, 21 May 2024 17:57:44 +0300
Subject: [PATCH 3/4] add torch

---
 requirements/requirements.txt | 1 +
 1 file changed, 1 insertion(+)

diff --git a/requirements/requirements.txt b/requirements/requirements.txt
index 93ec81d..52a9f91 100644
--- a/requirements/requirements.txt
+++ b/requirements/requirements.txt
@@ -11,5 +11,6 @@ optuna
 prettytable
 seaborn
 scikit-learn
+torch
 yfinance==0.2.28
 tqdm

From d60233a0cd7713549bd66fcf1f1b503e9459a88b Mon Sep 17 00:00:00 2001
From: letizia iannucci
Date: Mon, 3 Jun 2024 18:00:52 +0300
Subject: [PATCH 4/4] tf ops

---
 tsgm/models/cvae.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/tsgm/models/cvae.py b/tsgm/models/cvae.py
index 670b1e4..46baad9 100644
--- a/tsgm/models/cvae.py
+++ b/tsgm/models/cvae.py
@@ -127,8 +127,8 @@ def train_step_torch(self, data: torch.Tensor) -> T.Dict:
         z_mean, z_log_var, z = self.encoder(data)
         reconstruction = self.decoder(z)
         reconstruction_loss = self._get_reconstruction_loss(data, reconstruction)
-        kl_loss = -0.5 * (1 + z_log_var - torch.square(z_mean) - torch.exp(z_log_var))
-        kl_loss = torch.mean(torch.sum(kl_loss, axis=1))
+        kl_loss = -0.5 * (1 + z_log_var - tf.square(z_mean) - tf.exp(z_log_var))
+        kl_loss = tf.reduce_mean(tf.reduce_sum(kl_loss, axis=1))
         total_loss = reconstruction_loss + kl_loss
 
         self.total_loss_tracker.update_state(total_loss)
@@ -303,8 +303,8 @@ def train_step_torch(
         decoder_input = self._get_decoder_input(z_mean, labels)
         reconstruction = self.decoder(decoder_input)
         reconstruction_loss = self._get_reconstruction_loss(X, reconstruction)
-        kl_loss = -0.5 * (1 + z_log_var - torch.square(z_mean) - torch.exp(z_log_var))
-        kl_loss = torch.mean(torch.sum(kl_loss, axis=1))
+        kl_loss = -0.5 * (1 + z_log_var - tf.square(z_mean) - tf.exp(z_log_var))
+        kl_loss = tf.reduce_mean(tf.reduce_sum(kl_loss, axis=1))
         total_loss = reconstruction_loss + self.beta * kl_loss
 
         self.total_loss_tracker.update_state(total_loss)
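
For context, a minimal sketch of how the new train_step_torch added by this series might be driven from a plain PyTorch-style loop. This is illustrative only and not part of the patches: the names encoder, decoder, and X are hypothetical stand-ins, and it assumes the Keras encoder/decoder can consume the torch tensors produced by the loader (otherwise the batch would need converting first).

import torch
from torch.utils.data import DataLoader, TensorDataset

# Hypothetical setup: `encoder` and `decoder` are Keras models built
# elsewhere, and X is a float32 array of shape (n_samples, seq_len, feat_dim).
vae = BetaVAE(encoder, decoder, beta=1.0)
loader = DataLoader(
    TensorDataset(torch.tensor(X, dtype=torch.float32)),
    batch_size=64,
    shuffle=True,
)

for epoch in range(5):
    for (batch,) in loader:
        # Computes the reconstruction and KL losses for this batch and updates
        # the Keras metric trackers; no gradient step is taken inside the call.
        losses = vae.train_step_torch(batch)
    print(epoch, {k: float(v) for k, v in losses.items()})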