"""
The core wrapper assembles the submodules of the TimeMixer forecasting model
and controls the forward pass of the algorithm.

"""

# Created by Wenjie Du <[email protected]>
# License: BSD-3-Clause

import torch
import torch.nn as nn

from ...nn.functional import nonstationary_norm, nonstationary_denorm
from ...nn.functional.error import calc_mse
from ...nn.modules.timemixer import BackboneTimeMixer


class _TimeMixer(nn.Module):
    def __init__(
        self,
        n_steps: int,
        n_features: int,
        n_pred_steps: int,
        n_pred_features: int,
        term: str,
        n_layers: int,
        d_model: int,
        d_ffn: int,
        dropout: float,
        top_k: int,
        channel_independence: bool,
        decomp_method: str,
        moving_avg: int,
        downsampling_layers: int,
        downsampling_window: int,
        apply_nonstationary_norm: bool = False,
    ):
        super().__init__()

        self.n_pred_steps = n_pred_steps
        self.n_pred_features = n_pred_features
        self.apply_nonstationary_norm = apply_nonstationary_norm

        assert term in ["long", "short"], "forecasting term should be either 'long' or 'short'"
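        # the backbone's task_name is assembled from `term`,
        # i.e. it becomes either "long_term_forecast" or "short_term_forecast"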
        self.model = BackboneTimeMixer(
            task_name=term + "_term_forecast",
            n_steps=n_steps,
            n_features=n_features,
            n_pred_steps=n_pred_steps,
            n_pred_features=n_pred_features,
            n_layers=n_layers,
            d_model=d_model,
            d_ffn=d_ffn,
            dropout=dropout,
            channel_independence=channel_independence,
            decomp_method=decomp_method,
            top_k=top_k,
            moving_avg=moving_avg,
            downsampling_layers=downsampling_layers,
            downsampling_window=downsampling_window,
            downsampling_method="avg",
            use_future_temporal_feature=False,
        )

        # project the backbone output onto the prediction feature space (n_features -> n_pred_features)
        self.output_projection = nn.Linear(n_features, n_pred_features)

    def forward(self, inputs: dict) -> dict:
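        # expected entries in `inputs` (shapes inferred from their usage below):
        #   "X":            (batch_size, n_steps, n_features), the observed history
        #   "missing_mask": same shape as "X", 1 for observed values, 0 for missing ones
        #   "X_pred", "X_pred_missing_mask": training only, the forecasting targets and
        #                   their mask, of shape (batch_size, n_pred_steps, n_pred_features)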
        X, missing_mask = inputs["X"], inputs["missing_mask"]

        if self.training:
            X_pred, X_pred_missing_mask = inputs["X_pred"], inputs["X_pred_missing_mask"]
        else:
            batch_size = X.shape[0]
            X_pred, X_pred_missing_mask = (
                torch.zeros(batch_size, self.n_pred_steps, self.n_pred_features, device=X.device),
                torch.ones(batch_size, self.n_pred_steps, self.n_pred_features, device=X.device),
            )
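            # placeholders only: outside training the loss below is never computed,
            # so these zero/one tensors are not actually consumed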

        if self.apply_nonstationary_norm:
            # Normalization from Non-stationary Transformer
            X, means, stdev = nonstationary_norm(X, missing_mask)
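            # means and stdev are computed from the observed values indicated by
            # missing_mask, and are kept to de-normalize the backbone output below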
| 83 | + |
| 84 | + # TimesMixer processing |
| 85 | + enc_out = self.model.forecast(X, missing_mask) |

        if self.apply_nonstationary_norm:
            # De-Normalization from Non-stationary Transformer
            enc_out = nonstationary_denorm(enc_out, means, stdev)

        # project back to the original data space
        forecasting_result = self.output_projection(enc_out)
        # the raw output covers n_steps + n_pred_steps positions; only the last n_pred_steps are the forecast
        forecasting_result = forecasting_result[:, -self.n_pred_steps :]

        results = {
            "forecasting_data": forecasting_result,
        }

        # if in training mode, return results with losses
        if self.training:
            # `loss` is always the item used for backpropagation to update the model
            results["loss"] = calc_mse(X_pred, forecasting_result, X_pred_missing_mask)

        return results
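

# A minimal usage sketch with hypothetical hyperparameter values; in the full
# package this wrapper is normally built by a higher-level model class rather
# than instantiated directly, and "moving_avg" is assumed here to be a
# supported decomp_method:
#
#   model = _TimeMixer(
#       n_steps=24, n_features=7, n_pred_steps=12, n_pred_features=7,
#       term="long", n_layers=2, d_model=32, d_ffn=64, dropout=0.1,
#       top_k=5, channel_independence=False, decomp_method="moving_avg",
#       moving_avg=25, downsampling_layers=3, downsampling_window=2,
#   )
#   model.eval()
#   inputs = {
#       "X": torch.randn(8, 24, 7),
#       "missing_mask": torch.ones(8, 24, 7),
#   }
#   results = model(inputs)
#   results["forecasting_data"].shape  # expected: (8, 12, 7)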