
Commit aef2d2b

Merge branch 'main' into main
2 parents: 5e8f0db + b8dbacc

File tree: 3 files changed, +84 / -30 lines

3 files changed

+84
-30
lines changed

pyproject.toml

Lines changed: 3 additions & 0 deletions
@@ -220,5 +220,8 @@ filterwarnings = [
     "ignore:The number of training samples \\(\\d+\\) is smaller than the logging interval Trainer\\(:UserWarning",
     "ignore:The dataloader, [\\_\\s]+ \\d+, does not have many workers which may be a bottleneck.:UserWarning",
     "ignore:Consider increasing the value of the `num_workers` argument`:UserWarning",
+    "default::DeprecationWarning",
+    "default::PendingDeprecationWarning",
+    "default::FutureWarning",
     "ignore::UserWarning"
 ]
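The three new "default::" entries switch DeprecationWarning, PendingDeprecationWarning, and FutureWarning to the "default" action, so each such warning is shown once per location during the test run instead of being silenced, while the pre-existing blanket UserWarning filter stays in place. A rough Python-level equivalent of the resulting warnings filters, for illustration only:

import warnings

# Illustration only: approximate effect of the new pyproject.toml entries.
# The "default" action prints the first occurrence of a warning per location.
warnings.filterwarnings("default", category=DeprecationWarning)
warnings.filterwarnings("default", category=PendingDeprecationWarning)
warnings.filterwarnings("default", category=FutureWarning)
# The pre-existing entry that silences UserWarning is unchanged.
warnings.filterwarnings("ignore", category=UserWarning)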

pytorch_forecasting/data/encoders.py

Lines changed: 56 additions & 15 deletions
@@ -708,47 +708,82 @@ def transform(
         target_scale = self.get_parameters().numpy()[None, :]
         center = target_scale[..., 0]
         scale = target_scale[..., 1]
+
+        if not isinstance(y, torch.Tensor):
+            if isinstance(y, (pd.Series)):
+                index = y.index
+                pandas_dtype = y.dtype
+                y = y.values
+                y_was = "pandas"
+                y = torch.as_tensor(y)
+            elif isinstance(y, np.ndarray):
+                y_was = "numpy"
+                np_dtype = y.dtype
+                try:
+                    y = torch.from_numpy(y)
+                except TypeError:
+                    y = torch.as_tensor(y.astype(np.float32))
+        else:
+            y_was = "torch"
+            torch_dtype = y.dtype
+        if isinstance(center, np.ndarray):
+            center = torch.from_numpy(center)
+        if isinstance(scale, np.ndarray):
+            scale = torch.from_numpy(scale)
         if y.ndim > center.ndim:  # multiple batches -> expand size
             center = center.view(*center.size(), *(1,) * (y.ndim - center.ndim))
             scale = scale.view(*scale.size(), *(1,) * (y.ndim - scale.ndim))

-        # transform
-        dtype = y.dtype
         y = (y - center) / scale
-        try:
-            y = y.astype(dtype)
-        except AttributeError:  # torch.Tensor has `.type()` instead of `.astype()`
-            y = y.type(dtype)
+
+        if y_was == "numpy":
+            numpy_data = y.numpy()
+            if np_dtype.kind in "iu" and numpy_data.dtype.kind == "f":
+                # Original was integer, but normalized data is float
+                y = numpy_data.astype(np.float64)
+            else:
+                y = numpy_data.astype(np_dtype)
+        elif y_was == "pandas":
+            numpy_data = y.numpy()
+            if pandas_dtype.kind in "iu" and numpy_data.dtype.kind == "f":
+                pandas_dtype = np.float64
+            y = pd.Series(numpy_data, index=index, dtype=pandas_dtype)
+        else:
+            y = y.type(torch_dtype)

         # return with center and scale or without
         if return_norm:
             return y, target_scale
         else:
             return y

-    def inverse_transform(self, y: torch.Tensor) -> torch.Tensor:
+    def inverse_transform(self, y: Union[torch.Tensor, np.ndarray]) -> torch.Tensor:
         """
         Inverse scale.

         Parameters
         ----------
-        y: torch.Tensor
+        y: Union[torch.Tensor, np.ndarray])
             scaled data

         Returns
         -------
         torch.Tensor
             de-scaled data
         """
+        if isinstance(y, np.ndarray):
+            y = torch.from_numpy(y)
         return self(dict(prediction=y, target_scale=self.get_parameters().unsqueeze(0)))

-    def __call__(self, data: dict[str, torch.Tensor]) -> torch.Tensor:
+    def __call__(
+        self, data: dict[str, Union[torch.Tensor, np.ndarray]]
+    ) -> torch.Tensor:
         """
         Inverse transformation but with network output as input.

         Parameters
         ----------
-        data: Dict[str, torch.Tensor]
+        data: dict[str, Union[torch.Tensor, np.ndarray]]
             Dictionary with entries

             * prediction: data to de-scale
@@ -761,23 +796,29 @@ def __call__(self, data: dict[str, torch.Tensor]) -> torch.Tensor:
         """
         # ensure output dtype matches input dtype
         dtype = data["prediction"].dtype
+        if isinstance(dtype, np.dtype):
+            # convert the array into tensor if it is a numpy array
+            data["prediction"] = torch.as_tensor(data["prediction"])
+
+        prediction = data["prediction"]

         # inverse transformation with tensors
         norm = data["target_scale"]
-
+        if isinstance(norm, np.ndarray):
+            norm = torch.from_numpy(norm)
         # use correct shape for norm
-        if data["prediction"].ndim > norm.ndim:
+        if prediction.ndim > norm.ndim:
             norm = norm.unsqueeze(-1)

         # transform
-        y = data["prediction"] * norm[:, 1, None] + norm[:, 0, None]
+        y = prediction * norm[:, 1, None] + norm[:, 0, None]

         y = self.inverse_preprocess(y)

         # return correct shape
-        if data["prediction"].ndim == 1 and y.ndim > 1:
+        if prediction.ndim == 1 and y.ndim > 1:
             y = y.squeeze(0)
-        return y.type(dtype)
+        return y.type(prediction.dtype)


 class EncoderNormalizer(TorchNormalizer):
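Taken together, this hunk lets the patched transform accept pandas Series and numpy arrays in addition to torch tensors: the input is converted to a tensor for the actual scaling and then converted back to its original container, with integer inputs promoted to float64 because the normalized values are floating point. inverse_transform and __call__ gain matching numpy handling, and EncoderNormalizer (defined just below and exercised in the updated test) picks up the same behaviour. A minimal usage sketch mirroring the updated test in tests/test_data/test_encoders.py below, assuming a pytorch_forecasting install that includes this change:

import numpy as np
import pandas as pd
import torch
from pytorch_forecasting.data.encoders import EncoderNormalizer

normalizer = EncoderNormalizer(method="standard", center=True)

# fit_transform now accepts tensors, numpy arrays, and pandas Series alike,
# and returns the same container type it was given.
for data in (
    torch.rand(100),
    np.random.randn(100).astype(np.float32),
    pd.Series(np.random.randn(100).astype(np.float32)),
):
    transformed = normalizer.fit_transform(data)
    # inverse_transform also accepts numpy arrays now; like the test, we pass
    # a tensor explicitly via torch.as_tensor.
    restored = normalizer.inverse_transform(torch.as_tensor(transformed))
    assert torch.isclose(torch.as_tensor(data), restored, atol=1e-5).all()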

tests/test_data/test_encoders.py

Lines changed: 25 additions & 15 deletions
@@ -62,41 +62,51 @@ def test_NaNLabelEncoder_add():
     [
         dict(method="robust"),
         dict(method="robust", method_kwargs=dict(upper=1.0, lower=0.0)),
-        dict(method="robust", data=np.random.randn(100)),
-        dict(data=np.random.randn(100)),
+        dict(method="robust"),
         dict(transformation="log"),
         dict(transformation="softplus"),
         dict(transformation="log1p"),
         dict(transformation="relu"),
         dict(method="identity"),
-        dict(method="identity", data=np.random.randn(100)),
+        dict(
+            method="identity",
+        ),
         dict(center=False),
         dict(max_length=5),
-        dict(data=pd.Series(np.random.randn(100))),
         dict(max_length=[1, 2]),
     ],
 )
-def test_EncoderNormalizer(kwargs):
+@pytest.mark.parametrize("data_type", ["torch", "numpy", "pandas"])
+def test_EncoderNormalizer(kwargs, data_type):
+    transformation = kwargs.get("transformation")
+
+    if transformation in ["log", "log1p", "softplus", "relu"]:
+        base_data = np.random.uniform(0.1, 10, size=100)  # strictly positive
+    else:
+        base_data = np.random.randn(100)
+
+    if data_type == "torch":
+        data = torch.tensor(base_data, dtype=torch.float32)
+    elif data_type == "numpy":
+        data = base_data.astype(np.float32)
+    elif data_type == "pandas":
+        data = pd.Series(base_data.astype(np.float32))
     kwargs.setdefault("method", "standard")
     kwargs.setdefault("center", True)
-    kwargs.setdefault("data", torch.rand(100))
-    data = kwargs.pop("data")

     normalizer = EncoderNormalizer(**kwargs)
+    transformed = normalizer.fit_transform(data)
+    inverse = normalizer.inverse_transform(torch.as_tensor(transformed))

     if kwargs.get("transformation") in ["relu", "softplus", "log1p"]:
         assert (
-            normalizer.inverse_transform(
-                torch.as_tensor(normalizer.fit_transform(data))
-            )
-            >= 0
+            inverse >= 0
         ).all(), "Inverse transform should yield only positive values"
     else:
+        expected = torch.as_tensor(data)
         assert torch.isclose(
-            normalizer.inverse_transform(
-                torch.as_tensor(normalizer.fit_transform(data))
-            ),
-            torch.as_tensor(data),
+            inverse,
+            expected,
             atol=1e-5,
         ).all(), "Inverse transform should reverse transform"
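For reference, stacking @pytest.mark.parametrize decorators yields the cross product of their argument lists, so every kwargs entry above now runs once per data_type ("torch", "numpy", "pandas"). A toy sketch of that mechanism, with names that are illustrative rather than taken from the PR:

import pytest

# Toy example: two stacked parametrize decorators collect 2 * 3 = 6 test cases,
# one per (kwargs, data_type) combination.
@pytest.mark.parametrize("kwargs", [dict(method="standard"), dict(center=False)])
@pytest.mark.parametrize("data_type", ["torch", "numpy", "pandas"])
def test_cross_product_example(kwargs, data_type):
    assert isinstance(kwargs, dict)
    assert data_type in {"torch", "numpy", "pandas"}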
