PyPI - dsipts - Versions diffs - 1.1.9__py3-none-any.whl → 1.1.11__py3-none-any.whl - Mend

dsipts 1.1.9 (py3-none-any.whl) → 1.1.11 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

dsipts/data_structure/data_structure.py +38 -16
dsipts/models/ITransformer.py +2 -8
dsipts/models/TTM.py +58 -165
dsipts/models/base.py +52 -38
dsipts/models/base_v2.py +55 -37
dsipts/models/utils.py +7 -5
{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/METADATA +1 -1
{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/RECORD +10 -10
{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/WHEEL +0 -0
{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/top_level.txt +0 -0

dsipts/data_structure/data_structure.py CHANGED Viewed

@@ -35,7 +35,18 @@ from .modifiers import *
 from aim.pytorch_lightning import AimLogger
 import time
+class DummyScaler():
+    def __init__(self):
+        pass
+    def fit(self,x):
+        pass
+    def transform(self,x):
+        return x
+    def inverse_transform(self,x):
+        return x
+    def fit_transform(self,x):
+        return x
 pd.options.mode.chained_assignment = None
 log = logging.getLogger(__name__)
@@ -210,20 +221,23 @@ class TimeSeries():
         self.future_variables = []
         self.target_variables = ['signal']
         self.num_var = list(set(self.past_variables).union(set(self.future_variables)).union(set(self.target_variables)))
+        self.num_var = list(np.sort(self.num_var))
     def enrich(self,dataset,columns):
-        if columns =='hour':
-            dataset[columns] = dataset.time.dt.hour
-        elif columns=='dow':
-            dataset[columns] = dataset.time.dt.weekday
-        elif columns=='month':
-            dataset[columns] = dataset.time.dt.month
-        elif columns=='minute':
-            dataset[columns] = dataset.time.dt.minute
-        else:
-            if columns  not in dataset.columns:
-                beauty_string(f'I can not automatically enrich column {columns}. Please contact the developers or add it manually to your dataset.','section',True)
+        try:
+            if columns =='hour':
+                dataset[columns] = dataset.time.dt.hour
+            elif columns=='dow':
+                dataset[columns] = dataset.time.dt.weekday
+            elif columns=='month':
+                dataset[columns] = dataset.time.dt.month
+            elif columns=='minute':
+                dataset[columns] = dataset.time.dt.minute
+            else:
+                if columns  not in dataset.columns:
+                    beauty_string(f'I can not automatically enrich column {columns}. Please contact the developers or add it manually to your dataset.','section',True)
+        except:
+            beauty_string(f'I can not automatically enrich column {columns}. Probably not a temporal index.','section',True)
     def load_signal(self,data:pd.DataFrame,
                     enrich_cat:List[str] = [],
@@ -300,7 +314,7 @@ class TimeSeries():
             if check_past:
                 beauty_string('I will update past column adding all target columns, if you want to avoid this beahviour please use check_pass as false','info',self.verbose)
                 past_variables = list(set(past_variables).union(set(target_variables)))
+                past_variables = list(np.sort(past_variables))
         self.cat_past_var = cat_past_var
         self.cat_fut_var = cat_fut_var
@@ -321,14 +335,18 @@ class TimeSeries():
                 beauty_string('Categorical {c} already present, it will be added to categorical variable but not call the enriching function','info',self.verbose)
             else:
                 self.enrich(dataset,c)
+        self.cat_past_var = list(np.sort(self.cat_past_var))
+        self.cat_fut_var = list(np.sort(self.cat_fut_var))
         self.cat_var = list(set(self.cat_past_var+self.cat_fut_var)) ## all categorical data
+        self.cat_var = list(np.sort(self.cat_var))
         self.dataset = dataset
         self.past_variables = past_variables
         self.future_variables = future_variables
         self.target_variables = target_variables
         self.out_vars = len(target_variables)
         self.num_var = list(set(self.past_variables).union(set(self.future_variables)).union(set(self.target_variables)))
+        self.num_var = list(np.sort(self.num_var))
         if silly_model:
             beauty_string('YOU ARE TRAINING A SILLY MODEL WITH THE TARGETS IN THE INPUTS','section',self.verbose)
             self.future_variables+=self.target_variables
@@ -665,7 +683,11 @@ class TimeSeries():
         #self.model.apply(weight_init_zeros)
         self.config = config
+        try:
+            self.model = torch.compile(self.model)
+        except:
+            beauty_string('Can not compile the model','block',self.verbose)
         beauty_string('Setting the model','block',self.verbose)
         beauty_string(model,'',self.verbose)

dsipts/models/ITransformer.py CHANGED Viewed

@@ -8,6 +8,8 @@ import numpy as np
 from .itransformer.Transformer_EncDec import Encoder, EncoderLayer
 from .itransformer.SelfAttention_Family import FullAttention, AttentionLayer
 from .itransformer.Embed import DataEmbedding_inverted
+from ..data_structure.utils import beauty_string
+from .utils import  get_scope,get_activation,Embedding_cat_variables
 try:
     import lightning.pytorch as pl
@@ -17,12 +19,6 @@ except:
     import pytorch_lightning as pl
     OLD_PL = True
     from .base import Base
-from .utils import QuantileLossMO,Permute, get_activation
-from typing import List, Union
-from ..data_structure.utils import beauty_string
-from .utils import  get_scope
-from .utils import Embedding_cat_variables
@@ -34,8 +30,6 @@ class ITransformer(Base):
     description = get_scope(handle_multivariate,handle_future_covariates,handle_categorical_variables,handle_quantile_loss)
     def __init__(self,
                  # specific params
                  hidden_size:int,
                  d_model: int,

dsipts/models/TTM.py CHANGED Viewed

@@ -12,240 +12,133 @@ except:
     from .base import Base
-from typing import List,Union
-from .utils import  QuantileLossMO
+from .ttm.utils import get_model, get_frequency_token, count_parameters
 from ..data_structure.utils import beauty_string
-from .ttm.utils import get_model, get_frequency_token, count_parameters, RMSELoss
+from .utils import  get_scope
 class TTM(Base):
+    handle_multivariate = True
+    handle_future_covariates = True
+    handle_categorical_variables = True
+    handle_quantile_loss = True
+    description = get_scope(handle_multivariate,handle_future_covariates,handle_categorical_variables,handle_quantile_loss)
     def __init__(self,
                 model_path:str,
-                past_steps:int,
-                future_steps:int,
-                freq_prefix_tuning:bool,
-                freq:str,
                 prefer_l1_loss:bool,  # exog: set true to use l1 loss
                 prefer_longer_context:bool,
-                loss_type:str,
-                num_input_channels,
                 prediction_channel_indices,
-                exogenous_channel_indices,
+                exogenous_channel_indices_cont,
+                exogenous_channel_indices_cat,
                 decoder_mode,
+                freq,
+                freq_prefix_tuning,
                 fcm_context_length,
                 fcm_use_mixer,
                 fcm_mix_layers,
                 fcm_prepend_past,
                 enable_forecast_channel_mixing,
-                out_channels:int,
-                embs:List[int],
-                remove_last = False,
-                optim:Union[str,None]=None,
-                optim_config:dict=None,
-                scheduler_config:dict=None,
-                verbose = False,
-                use_quantiles=False,
-                persistence_weight:float=0.0,
-                quantiles:List[int]=[],
                 **kwargs)->None:
-        """TODO and FIX for future and past categorical variables
-        Args:
-            model_path (str): _description_
-            past_steps (int): _description_
-            future_steps (int): _description_
-            freq_prefix_tuning (bool): _description_
-            freq (str): _description_
-            prefer_l1_loss (bool): _description_
-            loss_type (str): _description_
-            num_input_channels (_type_): _description_
-            prediction_channel_indices (_type_): _description_
-            exogenous_channel_indices (_type_): _description_
-            decoder_mode (_type_): _description_
-            fcm_context_length (_type_): _description_
-            fcm_use_mixer (_type_): _description_
-            fcm_mix_layers (_type_): _description_
-            fcm_prepend_past (_type_): _description_
-            enable_forecast_channel_mixing (_type_): _description_
-            out_channels (int): _description_
-            embs (List[int]): _description_
-            remove_last (bool, optional): _description_. Defaults to False.
-            optim (Union[str,None], optional): _description_. Defaults to None.
-            optim_config (dict, optional): _description_. Defaults to None.
-            scheduler_config (dict, optional): _description_. Defaults to None.
-            verbose (bool, optional): _description_. Defaults to False.
-            use_quantiles (bool, optional): _description_. Defaults to False.
-            persistence_weight (float, optional): _description_. Defaults to 0.0.
-            quantiles (List[int], optional): _description_. Defaults to [].
-        """
-        super(TTM, self).__init__(verbose)
+        super().__init__(**kwargs)
         self.save_hyperparameters(logger=False)
-        self.future_steps = future_steps
-        self.use_quantiles = use_quantiles
-        self.optim = optim
-        self.optim_config = optim_config
-        self.scheduler_config = scheduler_config
-        self.persistence_weight = persistence_weight
-        self.loss_type = loss_type
-        self.remove_last = remove_last
-        self.embs = embs
-        self.freq = freq
-        self.extend_variables = False
-        # NOTE: For Hydra
-        prediction_channel_indices = list(prediction_channel_indices)
-        exogenous_channel_indices = list(exogenous_channel_indices)
-        if len(quantiles)>0:
-            assert len(quantiles)==3, beauty_string('ONLY 3 quantiles premitted','info',True)
-            self.use_quantiles = True
-            self.mul = len(quantiles)
-            self.loss = QuantileLossMO(quantiles)
-            self.extend_variables = True
-            if out_channels * 3 != len(prediction_channel_indices):
-                prediction_channel_indices, exogenous_channel_indices, num_input_channels = self.__add_quantile_features(prediction_channel_indices,
-                                                                                                                         exogenous_channel_indices,
-                                                                                                                         out_channels)
+        self.index_fut = list(exogenous_channel_indices_cont)
+        if len(exogenous_channel_indices_cat)>0:
+            self.index_fut_cat = (self.past_channels+len(self.embs_past))+list(exogenous_channel_indices_cat)
         else:
-            self.mul = 1
-            if self.loss_type == 'mse':
-                self.loss = nn.MSELoss(reduction="mean")
-            elif self.loss_type == 'rmse':
-                self.loss = RMSELoss()
-            else:
-                self.loss = nn.L1Loss()
+            self.index_fut_cat = []
+        self.freq = freq
         self.model = get_model(
             model_path=model_path,
-            context_length=past_steps,
-            prediction_length=future_steps,
-            freq_prefix_tuning=freq_prefix_tuning,
-            freq=freq,
+            context_length=self.past_steps,
+            prediction_length=self.future_steps,
             prefer_l1_loss=prefer_l1_loss,
             prefer_longer_context=prefer_longer_context,
-            num_input_channels=num_input_channels,
+            num_input_channels=self.past_channels+len(self.embs_past), #giusto
             decoder_mode=decoder_mode,
             prediction_channel_indices=list(prediction_channel_indices),
-            exogenous_channel_indices=list(exogenous_channel_indices),
+            exogenous_channel_indices=self.index_fut + self.index_fut_cat,
             fcm_context_length=fcm_context_length,
             fcm_use_mixer=fcm_use_mixer,
             fcm_mix_layers=fcm_mix_layers,
+            freq=freq,
+            freq_prefix_tuning=freq_prefix_tuning,
             fcm_prepend_past=fcm_prepend_past,
-            #loss='mse',
             enable_forecast_channel_mixing=enable_forecast_channel_mixing,
         )
-        self.__freeze_backbone()
-    def __add_quantile_features(self, prediction_channel_indices, exogenous_channel_indices, out_channels):
-        prediction_channel_indices = list(range(out_channels * 3))
-        exogenous_channel_indices = [prediction_channel_indices[-1] + i for i in range(1, len(exogenous_channel_indices)+1)]
-        num_input_channels = len(prediction_channel_indices) + len(exogenous_channel_indices)
-        return prediction_channel_indices, exogenous_channel_indices, num_input_channels
+        hidden_size =  self.model.config.hidden_size
+        self.model.prediction_head = torch.nn.Linear(hidden_size, self.out_channels*self.mul)
+        self._freeze_backbone()
-    def __freeze_backbone(self):
+    def _freeze_backbone(self):
         """
         Freeze the backbone of the model.
         This is useful when you want to fine-tune only the head of the model.
         """
-        print(
-            "Number of params before freezing backbone",
-            count_parameters(self.model),
-        )
+        beauty_string(f"Number of params before freezing backbone:{count_parameters(self.model)}",'info',self.verbose)
         # Freeze the backbone of the model
         for param in self.model.backbone.parameters():
             param.requires_grad = False
         # Count params
-        print(
-            "Number of params after freezing the backbone",
-            count_parameters(self.model),
-        )
+        beauty_string(f"Number of params after freezing the backbone: {count_parameters(self.model)}",'info',self.verbose)
-    def __scaler(self, input):
-        #new_data = torch.tensor([MinMaxScaler().fit_transform(step_data) for step_data in data])
-        for i, e in enumerate(self.embs):
+    def _scaler_past(self, input):
+        for i, e in enumerate(self.embs_past):
+            input[:,:,i] = input[:, :, i] / (e-1)
+        return input
+    def _scaler_fut(self, input):
+        for i, e in enumerate(self.embs_fut):
             input[:,:,i] = input[:, :, i] / (e-1)
         return input
-    def __build_tupla_indexes(self, size, target_idx, current_idx):
-        permute = list(range(size))
-        history = dict()
-        for j, i in enumerate(target_idx):
-            c = history.get(current_idx[j], current_idx[j])
-            permute[i], permute[c] = current_idx[j], i
-            history[i] = current_idx[j]
-    def __permute_indexes(self, values, target_idx, current_idx):
-        if current_idx is None or target_idx is None:
-            raise ValueError("Indexes cannot be None")
-        if sorted(current_idx) != sorted(target_idx):
-            return values[..., self.__build_tupla_indexes(values.shape[-1], target_idx, current_idx)]
-        return values
-    def __extend_with_quantile_variables(self, x, original_indexes):
-        covariate_indexes = [i for i in range(x.shape[-1]) if i not in original_indexes]
-        covariate_tensors = x[..., covariate_indexes]
-        new_tensors = [x[..., target_index] for target_index in original_indexes for _ in range(3)]
-        new_original_indexes = list(range(len(original_indexes) * 3))
-        return torch.cat([torch.stack(new_tensors, dim=-1), covariate_tensors], dim=-1), new_original_indexes
     def forward(self, batch):
         x_enc = batch['x_num_past']
         original_indexes = batch['idx_target'][0].tolist()
-        original_indexes_future = batch['idx_target_future'][0].tolist()
-        if self.extend_variables:
-            x_enc, original_indexes = self.__extend_with_quantile_variables(x_enc, original_indexes)
         if 'x_cat_past' in batch.keys():
             x_mark_enc = batch['x_cat_past'].to(torch.float32).to(self.device)
-            x_mark_enc = self.__scaler(x_mark_enc)
+            x_mark_enc = self._scaler_past(x_mark_enc)
             past_values = torch.cat((x_enc,x_mark_enc), axis=-1).type(torch.float32)
         else:
             past_values = x_enc
-        x_dec = torch.tensor([]).to(self.device)
+        future_values = torch.zeros_like(past_values)
+        future_values = future_values[:,:self.future_steps,:]
         if 'x_num_future' in batch.keys():
-            x_dec = batch['x_num_future'].to(self.device)
-            if self.extend_variables:
-                x_dec, original_indexes_future = self.__extend_with_quantile_variables(x_dec, original_indexes_future)
+            future_values[:,:,self.index_fut] = batch['x_num_future'].to(self.device)
         if 'x_cat_future' in batch.keys():
             x_mark_dec = batch['x_cat_future'].to(torch.float32).to(self.device)
-            x_mark_dec = self.__scaler(x_mark_dec)
-            future_values = torch.cat((x_dec, x_mark_dec), axis=-1).type(torch.float32)
-        else:
-            future_values = x_dec
-        if self.remove_last:
-            idx_target = batch['idx_target'][0]
-            x_start = x_enc[:,-1,idx_target].unsqueeze(1)
-            x_enc[:,:,idx_target]-=x_start
-        past_values = self.__permute_indexes(past_values, self.model.prediction_channel_indices, original_indexes)
+            x_mark_dec = self._scaler_fut(x_mark_dec)
+            future_values[:,:,self.index_cat_fut] = x_mark_dec
-        future_values = self.__permute_indexes(future_values, self.model.prediction_channel_indices, original_indexes_future)
-        freq_token = get_frequency_token(self.freq).repeat(x_enc.shape[0])
+        #investigating!!
+        freq_token = get_frequency_token(self.freq).repeat(past_values.shape[0])
         res = self.model(
             past_values= past_values,
-            future_values= future_values,
+            future_values= future_values,# future_values if future_values.shape[0]>0 else None,
             past_observed_mask = None,
             future_observed_mask = None,
             output_hidden_states =  False,
             return_dict = False,
-            freq_token= freq_token,
+            freq_token= freq_token, ##investigating
             static_categorical_values = None
         )
-        #args = None
-        #res = self.model(**args)
         BS = res.shape[0]
         return res.reshape(BS,self.future_steps,-1,self.mul)

dsipts/models/base.py CHANGED Viewed

@@ -111,8 +111,11 @@ class Base(pl.LightningModule):
         self.train_loss_epoch = -100.0
         self.verbose = verbose
         self.name = self.__class__.__name__
-        self.train_epoch_metrics = []
-        self.validation_epoch_metrics = []
+        self.register_buffer("train_epoch_metrics", torch.tensor(0.0))
+        self.register_buffer("validation_epoch_metrics", torch.tensor(0.0))
+        self.register_buffer("train_epoch_count", torch.tensor(0))
+        self.register_buffer("validation_epoch_count", torch.tensor(0))
         self.use_quantiles = True if len(quantiles)>0 else False
         self.quantiles =  quantiles
@@ -136,9 +139,9 @@ class Base(pl.LightningModule):
             self.is_classification = False
             if len(self.quantiles)>0:
                 if self.loss_type=='cprs':
-                    self.use_quantiles = False
+                    self.use_quantiles = True
                     self.mul = len(self.quantiles)
-                    self.loss = CPRS()
+                    self.loss = CPRS(alpha=self.persistence_weight)
                 else:
                     assert len(self.quantiles)==3, beauty_string('ONLY 3 quantiles premitted','info',True)
                     self.use_quantiles = True
@@ -193,7 +196,9 @@ class Base(pl.LightningModule):
         """
         if self.loss_type=='cprs':
             tmp = self(batch)
-            return tmp.mean(axis=-1)
+            tmp = torch.quantile(tmp, torch.tensor([0.05, 0.5, 0.95]), dim=-1).permute(1,2,3,0)
+            return tmp
+            #return tmp.mean(axis=-1).unsqueeze(-1)
         return self(batch)
@@ -293,7 +298,8 @@ class Base(pl.LightningModule):
                 y_hat = self(batch)
                 loss = self.compute_loss(batch,y_hat)
-        self.train_epoch_metrics.append(loss.item())
+        self.train_epoch_metrics+=loss.detach()
+        self.train_epoch_count +=1
         return loss
@@ -309,27 +315,20 @@ class Base(pl.LightningModule):
             y_hat = self(batch)
             score = 0
         if batch_idx==0:
-            if self.use_quantiles:
-                idx = 1
-            else:
-                idx = 0
-            #track the predictions! We can do better than this but maybe it is better to firstly update pytorch-lightening
             if self.count_epoch%int(max(self.trainer.max_epochs/100,1))==1:
-                for i in range(batch['y'].shape[2]):
-                    real =  batch['y'][0,:,i].cpu().detach().numpy()
-                    pred =  y_hat[0,:,i,idx].cpu().detach().numpy()
-                    fig, ax = plt.subplots(figsize=(7,5))
-                    ax.plot(real,'o-',label='real')
-                    ax.plot(pred,'o-',label='pred')
-                    ax.legend()
-                    ax.set_title(f'Channel {i} first element first batch validation {int(100*self.count_epoch/self.trainer.max_epochs)}%')
-                    self.logger.experiment.track(Image(fig), name='cm_training_end')
-                    #self.log(f"example_{i}", np.stack([real, pred]).T,sync_dist=True)
-        return self.compute_loss(batch,y_hat)+score
+                self._val_outputs.append({
+                    "y": batch['y'].detach().cpu(),
+                    "y_hat": y_hat.detach().cpu()
+                })
+        self.validation_epoch_metrics = (self.compute_loss(batch,y_hat)+score).detach()
+        self.validation_epoch_count+=1
+        return None #self.compute_loss(batch,y_hat)+score
+    def on_validation_start(self):
+        # reset buffer each epoch
+        self._val_outputs = []
     def validation_epoch_end(self, outs):
         """
@@ -337,14 +336,30 @@ class Base(pl.LightningModule):
         :meta private:
         """
-        if len(outs)==0:
-            loss = 10000
-            beauty_string(f'THIS IS A BUG, It should be polulated','info',self.verbose)
-        else:
-            loss = torch.stack(outs).mean()
-        self.log("val_loss", loss.item(),sync_dist=True)
-        beauty_string(f'Epoch: {self.count_epoch} train error: {self.train_loss_epoch:.4f} validation loss: {loss.item():.4f}','info',self.verbose)
+        if len(self._val_outputs)>0:
+            ys = torch.cat([o["y"] for o in self._val_outputs])
+            y_hats = torch.cat([o["y_hat"] for o in self._val_outputs])
+            if self.use_quantiles:
+                idx = 1
+            else:
+                idx = 0
+            for i in range(ys.shape[2]):
+                real =  ys[0,:,i].cpu().detach().numpy()
+                pred =  y_hats[0,:,i,idx].cpu().detach().numpy()
+                fig, ax = plt.subplots(figsize=(7,5))
+                ax.plot(real,'o-',label='real')
+                ax.plot(pred,'o-',label='pred')
+                ax.legend()
+                ax.set_title(f'Channel {i} first element first batch validation {int(100*self.count_epoch/self.trainer.max_epochs)}%')
+                self.logger.experiment.track(Image(fig), name='cm_training_end')
+                #self.log(f"example_{i}", np.stack([real, pred]).T,sync_dist=True)
+                plt.close(fig)
+        avg = self.validation_epoch_metrics/self.validation_epoch_count
+        self.validation_epoch_metrics.zero_()
+        self.validation_epoch_count.zero_()
+        self.log("val_loss", avg,sync_dist=True)
+        beauty_string(f'Epoch: {self.count_epoch} train error: {self.train_loss_epoch:.4f} validation loss: {avg:.4f}','info',self.verbose)
     def training_epoch_end(self, outs):
         """
@@ -353,12 +368,11 @@ class Base(pl.LightningModule):
         :meta private:
         """
-        loss = sum(outs['loss'] for outs in outs) / len(outs)
-        self.log("train_loss", loss.item(),sync_dist=True)
+        loss = self.train_epoch_metrics/self.global_step
+        self.log("train_loss", loss,sync_dist=True)
         self.count_epoch+=1
-        self.train_loss_epoch = loss.item()
+        self.train_loss_epoch = loss
     def compute_loss(self,batch,y_hat):
         """
         custom loss calculation

dsipts/models/base_v2.py CHANGED Viewed

@@ -15,7 +15,6 @@ from typing import List, Union
 from .utils import QuantileLossMO, CPRS
 import torch.nn as nn
 def standardize_momentum(x,order):
     mean = torch.mean(x,1).unsqueeze(1).repeat(1,x.shape[1],1)
     num = torch.pow(x-mean,order).mean(axis=1)
@@ -113,8 +112,13 @@ class Base(pl.LightningModule):
         self.train_loss_epoch = -100.0
         self.verbose = verbose
         self.name = self.__class__.__name__
-        self.train_epoch_metrics = []
-        self.validation_epoch_metrics = []
+        #self.train_epoch_metrics = 0
+        #self.validation_epoch_metrics = 0
+        self.register_buffer("train_epoch_metrics", torch.tensor(0.0))
+        self.register_buffer("validation_epoch_metrics", torch.tensor(0.0))
+        self.register_buffer("train_epoch_count", torch.tensor(0))
+        self.register_buffer("validation_epoch_count", torch.tensor(0))
         self.use_quantiles = True if len(quantiles)>0 else False
         self.quantiles =  quantiles
@@ -138,9 +142,9 @@ class Base(pl.LightningModule):
             self.is_classification = False
             if len(self.quantiles)>0:
                 if self.loss_type=='cprs':
-                    self.use_quantiles = False
+                    self.use_quantiles = True
                     self.mul = len(self.quantiles)
-                    self.loss = CPRS()
+                    self.loss = CPRS(alpha=self.persistence_weight)
                 else:
                     assert len(self.quantiles)==3, beauty_string('ONLY 3 quantiles premitted','info',True)
                     self.use_quantiles = True
@@ -197,7 +201,9 @@ class Base(pl.LightningModule):
         if self.loss_type=='cprs':
             tmp = self(batch)
-            return tmp.mean(axis=-1)
+            tmp = torch.quantile(tmp, torch.tensor([0.05, 0.5, 0.95]), dim=-1).permute(1,2,3,0)
+            return tmp
+            #return tmp.mean(axis=-1).unsqueeze(-1)
         return self(batch)
@@ -297,7 +303,8 @@ class Base(pl.LightningModule):
                 y_hat = self(batch)
                 loss = self.compute_loss(batch,y_hat)
-        self.train_epoch_metrics.append(loss.item())
+        self.train_epoch_metrics+=loss.detach()
+        self.train_epoch_count +=1
         return loss
@@ -314,41 +321,54 @@ class Base(pl.LightningModule):
             y_hat = self(batch)
             score = 0
         if batch_idx==0:
-            if self.use_quantiles:
-                idx = 1
-            else:
-                idx = 0
             #track the predictions! We can do better than this but maybe it is better to firstly update pytorch-lightening
             if self.count_epoch%int(max(self.trainer.max_epochs/100,1))==1:
+                self._val_outputs.append({
+                    "y": batch['y'].detach().cpu(),
+                    "y_hat": y_hat.detach().cpu()
+                })
+        self.validation_epoch_metrics+= (self.compute_loss(batch,y_hat)+score).detach()
+        self.validation_epoch_count+=1
+        return None
-                for i in range(batch['y'].shape[2]):
-                    real =  batch['y'][0,:,i].cpu().detach().numpy()
-                    pred =  y_hat[0,:,i,idx].cpu().detach().numpy()
-                    fig, ax = plt.subplots(figsize=(7,5))
-                    ax.plot(real,'o-',label='real')
-                    ax.plot(pred,'o-',label='pred')
-                    ax.legend()
-                    ax.set_title(f'Channel {i} first element first batch validation {int(100*self.count_epoch/self.trainer.max_epochs)}%')
-                    self.logger.experiment.track(Image(fig), name='cm_training_end')
-                    #self.log(f"example_{i}", np.stack([real, pred]).T,sync_dist=True)
-        self.validation_epoch_metrics.append(self.compute_loss(batch,y_hat)+score)
-        return
+    def on_validation_start(self):
+        # reset buffer each epoch
+        self._val_outputs = []
     def on_validation_epoch_end(self):
         """
         pythotrch lightening stuff
         :meta private:
-        """
+        """
-        if len(self.validation_epoch_metrics)==0:
-            avg = 10000
-            beauty_string(f'THIS IS A BUG, It should be polulated','info',self.verbose)
-        else:
-            avg = torch.stack(self.validation_epoch_metrics).mean()
-        self.validation_epoch_metrics = []
+        if len(self._val_outputs)>0:
+            ys = torch.cat([o["y"] for o in self._val_outputs])
+            y_hats = torch.cat([o["y_hat"] for o in self._val_outputs])
+            if self.use_quantiles:
+                idx = 1
+            else:
+                idx = 0
+            for i in range(ys.shape[2]):
+                real =  ys[0,:,i].cpu().detach().numpy()
+                pred =  y_hats[0,:,i,idx].cpu().detach().numpy()
+                fig, ax = plt.subplots(figsize=(7,5))
+                ax.plot(real,'o-',label='real')
+                ax.plot(pred,'o-',label='pred')
+                ax.legend()
+                ax.set_title(f'Channel {i} first element first batch validation {int(100*self.count_epoch/self.trainer.max_epochs)}%')
+                self.logger.experiment.track(Image(fig), name='cm_training_end')
+                #self.log(f"example_{i}", np.stack([real, pred]).T,sync_dist=True)
+                plt.close(fig)
+        avg = self.validation_epoch_metrics/self.validation_epoch_count
+        self.validation_epoch_metrics.zero_()
+        self.validation_epoch_count.zero_()
         self.log("val_loss", avg,sync_dist=True)
         beauty_string(f'Epoch: {self.count_epoch} train error: {self.train_loss_epoch:.4f} validation loss: {avg:.4f}','info',self.verbose)
@@ -359,14 +379,12 @@ class Base(pl.LightningModule):
         :meta private:
         """
-        if len(self.train_epoch_metrics)==0:
-            avg = 0
-            beauty_string(f'THIS IS A BUG, It should be polulated','info',self.verbose)
-        else:
-            avg = np.stack(self.train_epoch_metrics).mean()
+        avg = self.train_epoch_metrics/self.train_epoch_count
         self.log("train_loss", avg,sync_dist=True)
         self.count_epoch+=1
-        self.train_epoch_metrics = []
+        self.train_epoch_metrics.zero_()
+        self.train_epoch_count.zero_()
         self.train_loss_epoch = avg
     def compute_loss(self,batch,y_hat):

dsipts/models/utils.py CHANGED Viewed

@@ -633,7 +633,7 @@ class CPRS(nn.Module):
     with large ensembles.
     """
-    def __init__(self, alpha=0.95, reduction='mean'):
+    def __init__(self, alpha=0.5, reduction='mean'):
         super().__init__()
         self.alpha = alpha
         self.reduction = reduction
@@ -674,17 +674,19 @@ class CPRS(nn.Module):
         # Create mask to exclude diagonal (i=j)
         mask = ~torch.eye(n_members, dtype=torch.bool, device=ensemble.device)
         mask = mask.view(1, n_members, n_members, *[1]*(len(ensemble.shape)-2))
         # Apply mask and compute mean
-        pairwise_term = (pairwise_diffs * mask).sum(dim=(1, 2)) / (n_members * (n_members - 1))
+        pairwise_term = (pairwise_diffs * mask).sum(dim=(1, 2)) ##formula 3 second term
         # Combine terms according to afCRPS formula
-        loss = mae_term - (1 - epsilon) * pairwise_term
+        loss = mae_term - (1 - epsilon) * pairwise_term/ (2*n_members * (n_members - 1))
         # Apply weights if provided
         if weights is not None:
             loss = loss * weights
+        #if loss.mean()<-2:
+        #    import pdb
+        #    pdb.set_trace()
         # Apply reduction
         if self.reduction == 'none':
             return loss

{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: dsipts
-Version: 1.1.9
+Version: 1.1.11
 Summary: Unified library for timeseries modelling
 Author-email: Andrea Gobbi <agobbi@fbk.eu>
 Project-URL: Homepage, https://github.com/DSIP-FBK/DSIPTS

{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/RECORD RENAMED Viewed

@@ -3,7 +3,7 @@ dsipts/data_management/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3
 dsipts/data_management/monash.py,sha256=aZxq9FbIH6IsU8Lwou1hAokXjgOAK-wdl2VAeFg2k4M,13075
 dsipts/data_management/public_datasets.py,sha256=yXFzOZZ-X0ZG1DoqVU-zFmEGVMc2033YDQhRgYxY8ws,6793
 dsipts/data_structure/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-dsipts/data_structure/data_structure.py,sha256=87VtKelx2EPoddrVYcja9dO5rQqaS83vZlQB_NY54PI,58994
+dsipts/data_structure/data_structure.py,sha256=uyGkc1eDjETpXb8rgMMbRUjG8i9Xiiu6vZc64xfTiew,59914
 dsipts/data_structure/modifiers.py,sha256=qlry9dfw8pEE0GrvgwROZJkJ6oPpUnjEHPIG5qIetss,7948
 dsipts/data_structure/utils.py,sha256=QwfKPZgSy6DIw5n6ztOdPJIAnzo4EnlMTgRbpiWnyko,6593
 dsipts/models/Autoformer.py,sha256=ddGT3L9T4gAXNJHx1TsuYZy7j63Anyr0rkqqXaOoSu4,8447
@@ -13,7 +13,7 @@ dsipts/models/Diffusion.py,sha256=pUujnrdeSSkj4jC1RORbcptt03KpuCsGVwg414o4LPg,40
 dsipts/models/DilatedConv.py,sha256=_c0NvFuT3vbYmo9A8cQchGo1XVb0qOpzBprNEkkAgiE,14292
 dsipts/models/DilatedConvED.py,sha256=fXk1-EWiRC5J_VIepTjYKya_D02SlEAkyiJcCjhW_XU,14004
 dsipts/models/Duet.py,sha256=EharWHT_r7tEYIk7BkozVLPZ0xptE5mmQmeFGm3uBsA,7628
-dsipts/models/ITransformer.py,sha256=jO8wxLaC06Wgu4GncrFFTISv3pVyfFLLhQvbEOYsz6Y,7368
+dsipts/models/ITransformer.py,sha256=qMsk27PqpnakNY1YM_rbkj8MO6BaG06N3b6m30Oa0RQ,7256
 dsipts/models/Informer.py,sha256=ByJ00qGk12ONFF7NZWAACzxxRb5UXcu5wpkGMYX9Cq4,6920
 dsipts/models/LinearTS.py,sha256=B0-Sz4POwUyl-PN2ssSx8L-ZHgwrQQPcMmreyvSS47U,9104
 dsipts/models/PatchTST.py,sha256=Z7DM1Kw5Ym8Hh9ywj0j9RuFtKaz_yVZmKFIYafjceM8,9061
@@ -23,14 +23,14 @@ dsipts/models/Samformer.py,sha256=s61Hi1o9iuw-KgSBPfiE80oJcK1j2fUA6N9f5BJgKJc,55
 dsipts/models/Simple.py,sha256=K82E88A62NhV_7U9Euu2cn3Q8P287HDR7eIy7VqgwbM,3909
 dsipts/models/TFT.py,sha256=JO2-AKIUag7bfm9Oeo4KmGfdYZJbzQBHPDqGVg0WUZI,13830
 dsipts/models/TIDE.py,sha256=i8qXac2gImEVgE2X6cNxqW5kuQP3rzWMlQNdgJbNmKM,13033
-dsipts/models/TTM.py,sha256=WpCiTN0qX3JFO6xgPLedoqMKXUC2pQpNAe9ee-Rw89Q,10602
+dsipts/models/TTM.py,sha256=gc-8yzEtn8ZdRVvsZfZvz7iE-RgqpZc-JGmOCQr4U_0,5215
 dsipts/models/TimeXER.py,sha256=aCg0003LxYZzqZWyWugpbW_iOybcdHN4OH6_v77qp4o,7056
 dsipts/models/VQVAEA.py,sha256=sNJi8UZh-10qEIKcZK3SzhlOFUUjvqjoglzeZBFaeZM,13789
 dsipts/models/VVA.py,sha256=BnPkJ0Nzue0oShSHZVRNlf5RvT0Iwtf9bx19vLB9Nn0,11939
 dsipts/models/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-dsipts/models/base.py,sha256=-K6ZxmXism231GqBxM3-pXE_KA4a4QWuYJ6FM_uSRl4,18859
-dsipts/models/base_v2.py,sha256=39EJO3m00HvT3zkn8PO67YEckAVa3Ez3NQ5oEnwz9g8,19137
-dsipts/models/utils.py,sha256=eBEpczdHn--ftK9I0pOiSY4ANGLzkw1WIL3SOoV9y7Y,24412
+dsipts/models/base.py,sha256=Gqsycy8ZXGaIVx9vvmYRpBCqdUxGE4tvC5ltgxlpEYY,19640
+dsipts/models/base_v2.py,sha256=eraXo1IBEQmyW41f1dz3Q-i-61vZ2AS3tVz6_X8J0Pg,19886
+dsipts/models/utils.py,sha256=kjTwyktNCFMpPUy6zoleBCSKlvMvK_Jkgyh2T1OXg3E,24497
 dsipts/models/autoformer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 dsipts/models/autoformer/layers.py,sha256=xHt8V1lKdD1cIvgxXdDbI_EqOz4zgOQ6LP8l7M1pAxM,13276
 dsipts/models/crossformer/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -76,7 +76,7 @@ dsipts/models/vva/minigpt.py,sha256=bg0JddqSD322uxSGexen3nPXL_hGTsk3vNLR62d7-w8,
 dsipts/models/vva/vqvae.py,sha256=RzCQ_M9xBprp7_x20dSV3EQqlO0FjPUGWV-qdyKrQsM,19680
 dsipts/models/xlstm/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 dsipts/models/xlstm/xLSTM.py,sha256=ZKZZmffmIq1Vb71CR4GSyM8viqVx-u0FChxhcNgHub8,10081
-dsipts-1.1.9.dist-info/METADATA,sha256=vraJDpYWc4hhcOfaj3C4E5hACrTNlYSEgGsT2zKyiPs,24794
-dsipts-1.1.9.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-dsipts-1.1.9.dist-info/top_level.txt,sha256=i6o0rf5ScFwZK21E89dSKjVNjUBkrEQpn0-Vij43748,7
-dsipts-1.1.9.dist-info/RECORD,,
+dsipts-1.1.11.dist-info/METADATA,sha256=fbMTKqi7b_vlvtmVSp5XJdkFrEC9SFF3DG_fKy58k_8,24795
+dsipts-1.1.11.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+dsipts-1.1.11.dist-info/top_level.txt,sha256=i6o0rf5ScFwZK21E89dSKjVNjUBkrEQpn0-Vij43748,7
+dsipts-1.1.11.dist-info/RECORD,,

{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/WHEEL RENAMED Viewed

File without changes

{dsipts-1.1.9.dist-info → dsipts-1.1.11.dist-info}/top_level.txt RENAMED Viewed

File without changes

dsipts 1.1.9__py3-none-any.whl → 1.1.11__py3-none-any.whl

dsipts 1.1.9__py3-none-any.whl → 1.1.11__py3-none-any.whl