Keep torch.Tensor instead of np.ndarray

2026-05-24 01:58:27 +00:00 · 2026-02-18 14:41:03 +00:00 · 2026-02-18 14:41:03 +00:00 · b4914823f2
commit b4914823f2
parent 40a7071ed8
1 changed files with 73 additions and 68 deletions
--- a/src/chronos/chronos2/dataset.py
+++ b/src/chronos/chronos2/dataset.py
@ -26,8 +26,8 @@ RawTask = Mapping[str, TensorOrArray | Mapping[str, TensorOrArray | None]]
 class PreparedTask(TypedDict):
    """A preprocessed time series task ready for model training/inference."""

-    context: np.ndarray  # (n_variates, history_length), float32
-    future_covariates: np.ndarray  # (n_variates, prediction_length), float32
+    context: torch.Tensor  # (n_variates, history_length), float32
+    future_covariates: torch.Tensor  # (n_variates, prediction_length), float32
    n_targets: int
    n_covariates: int
    n_future_covariates: int
@ -74,8 +74,15 @@ def validate_and_prepare_single_dict_task(

    Returns
    ------
-    PreparedTask
-        A dictionary containing preprocessed arrays ready for model consumption.
+    PreparedTask
+        A dictionary with the following entries:
+        - context: Concatenated float32 tensor of targets and past covariates of shape (group_size, history_length). The first `n_targets`
+          rows contain the target variables; the remaining rows contain past-only covariates followed by past values of known future covariates.
+        - future_covariates: float32 tensor of shape (group_size, prediction_length). The last `n_future_covariates` rows contain the known
+          future covariates; all rows corresponding to targets and past-only covariates are filled with NaNs.
+        - n_targets: Number of target variables.
+        - n_covariates: Total number of covariates (sum of past-only and known future covariates).
+        - n_future_covariates: Number of known future covariates.
    """

    allowed_keys = {"target", "past_covariates", "future_covariates"}
@ -89,18 +96,18 @@ def validate_and_prepare_single_dict_task(
    if "target" not in keys:
        raise ValueError(f"Element at index {idx} does not contain the required key 'target'")

-    # validate target - convert to numpy float32 (handles bfloat16 and other dtypes)
+    # validate target
    task_target = task["target"]
-    if isinstance(task_target, torch.Tensor):
-        task_target = task_target.to(torch.float32).numpy()
-    task_target = np.asarray(task_target, dtype=np.float32)
+    if isinstance(task_target, np.ndarray):
+        task_target = torch.from_numpy(task_target)
+    assert isinstance(task_target, torch.Tensor)
    if task_target.ndim > 2:
        raise ValueError(
            "When the input is a list of dicts, the `target` should either be 1-d with shape (history_length,) "
            f" or 2-d with shape (n_variates, history_length). Found element at index {idx} with shape {tuple(task_target.shape)}."
        )
    history_length = task_target.shape[-1]
-    task_target = task_target.reshape(-1, history_length)
+    task_target = task_target.view(-1, history_length)

    # validate past_covariates
    cat_encoders: dict = {}
@ -128,81 +135,87 @@ def validate_and_prepare_single_dict_task(
        )

    # create ordered keys: past-only first, then known-future (so known-future are the last rows)
-    task_past_only_keys = [k for k in task_covariates_keys if k not in task_future_covariates_keys]
+    task_past_only_keys = [k for k in task_covariates_keys if k not in task_future_covariates_keys]  # past_only_keys
    task_ordered_covariate_keys = task_past_only_keys + task_future_covariates_keys

-    task_past_covariates_list: list[np.ndarray] = []
+    task_past_covariates_list: list[torch.Tensor] = []
    for key in task_ordered_covariate_keys:
        tensor = task_past_covariates[key]
-        if isinstance(tensor, torch.Tensor):
-            tensor = tensor.to(torch.float32).numpy()
-        tensor = np.asarray(tensor)
-        # apply encoding to categorical variates
-        if not np.issubdtype(tensor.dtype, np.number):
-            # target encoding, if the target is 1-d
-            if task_target.shape[0] == 1:
-                cat_encoder = TargetEncoder(target_type="continuous", smooth=1.0)
-                X = tensor.astype(str).reshape(-1, 1)
-                y = task_target.reshape(-1)
-                mask = np.isfinite(y)
-                cat_encoder.fit(X[mask], y[mask])
-            # ordinal encoding, if the target is > 1-d
-            else:
-                cat_encoder = OrdinalEncoder(handle_unknown="use_encoded_value", unknown_value=np.nan)
-                cat_encoder.fit(tensor.astype(str).reshape(-1, 1))
-            tensor = cat_encoder.transform(tensor.astype(str).reshape(-1, 1)).reshape(tensor.shape)
-            cat_encoders[key] = cat_encoder
+        if isinstance(tensor, np.ndarray):
+            # apply encoding to categorical variates
+            if not np.issubdtype(tensor.dtype, np.number):
+                # target encoding, if the target is 1-d
+                if task_target.shape[0] == 1:
+                    cat_encoder = TargetEncoder(target_type="continuous", smooth=1.0)
+                    X = tensor.astype(str).reshape(-1, 1)
+                    y = task_target.view(-1).numpy()
+                    mask = np.isfinite(y)
+                    X = X[mask]
+                    y = y[mask]
+                    cat_encoder.fit(X, y)
+                # ordinal encoding, if the target is > 1-d
+                else:
+                    cat_encoder = OrdinalEncoder(handle_unknown="use_encoded_value", unknown_value=np.nan)
+                    cat_encoder.fit(tensor.astype(str).reshape(-1, 1))
+                tensor = cat_encoder.transform(tensor.astype(str).reshape(-1, 1)).reshape(tensor.shape)
+                cat_encoders[key] = cat_encoder
+            tensor = torch.from_numpy(tensor)
+        assert isinstance(tensor, torch.Tensor)
        if tensor.ndim != 1 or len(tensor) != history_length:
            raise ValueError(
                f"Individual `past_covariates` must be 1-d with length equal to the length of `target` (= {history_length}), "
                f"found: {key} with shape {tuple(tensor.shape)} in element at index {idx}"
            )
        task_past_covariates_list.append(tensor)
-    task_past_covariates_array = (
-        np.stack(task_past_covariates_list, axis=0)
+    task_past_covariates_tensor = (
+        torch.stack(task_past_covariates_list, dim=0)
        if task_past_covariates_list
-        else np.zeros((0, history_length), dtype=np.float32)
+        else torch.zeros((0, history_length), device=task_target.device)
    )

    # validate future_covariates (build rows in the same task_ordered_covariate_keys order)
-    task_future_covariates_list: list[np.ndarray] = []
+    task_future_covariates_list: list[torch.Tensor] = []
    for key in task_ordered_covariate_keys:
        # future values of past-only covariates are filled with NaNs
-        tensor = task_future_covariates.get(key, np.full(prediction_length, np.nan))
-        if isinstance(tensor, torch.Tensor):
-            tensor = tensor.to(torch.float32).numpy()
-        tensor = np.asarray(tensor)
-        # apply encoding to categorical variates
-        if not np.issubdtype(tensor.dtype, np.number):
-            cat_encoder = cat_encoders[key]
-            tensor = cat_encoder.transform(tensor.astype(str).reshape(-1, 1)).reshape(tensor.shape)
+        tensor = task_future_covariates.get(key, torch.full((prediction_length,), fill_value=torch.nan))
+        if isinstance(tensor, np.ndarray):
+            # apply encoding to categorical variates
+            if not np.issubdtype(tensor.dtype, np.number):
+                cat_encoder = cat_encoders[key]
+                tensor = cat_encoder.transform(tensor.astype(str).reshape(-1, 1)).reshape(tensor.shape)
+            tensor = torch.from_numpy(tensor)
+        assert isinstance(tensor, torch.Tensor)
        if tensor.ndim != 1 or len(tensor) != prediction_length:
            raise ValueError(
                f"Individual `future_covariates` must be 1-d with length equal to the {prediction_length=}, "
                f"found: {key} with shape {tuple(tensor.shape)} in element at index {idx}"
            )
        task_future_covariates_list.append(tensor)
-    task_future_covariates_array = (
-        np.stack(task_future_covariates_list, axis=0)
+    task_future_covariates_tensor = (
+        torch.stack(task_future_covariates_list, dim=0)
        if task_future_covariates_list
-        else np.zeros((0, prediction_length), dtype=np.float32)
+        else torch.zeros((0, prediction_length), device=task_target.device)
    )
    # future values of target series are filled with NaNs
-    task_future_covariates_target_padding = np.full(
-        (task_target.shape[0], prediction_length), np.nan, dtype=np.float32
+    task_future_covariates_target_padding = torch.full(
+        (task_target.shape[0], prediction_length), fill_value=torch.nan, device=task_target.device
    )

-    context = np.concatenate([task_target, task_past_covariates_array], axis=0).astype(np.float32)
-    future_covariates = np.concatenate(
-        [task_future_covariates_target_padding, task_future_covariates_array], axis=0
-    ).astype(np.float32)
+    task_context_tensor = torch.cat([task_target, task_past_covariates_tensor], dim=0).to(dtype=torch.float32)
+    task_future_covariates_tensor = torch.cat(
+        [task_future_covariates_target_padding, task_future_covariates_tensor], dim=0
+    ).to(dtype=torch.float32)
+    task_n_targets = task_target.shape[0]
+    task_n_covariates = task_past_covariates_tensor.shape[0]
+    # number of known-future covariates
+    task_n_future_covariates = len(task_future_covariates_keys)

    return PreparedTask(
-        context=context,
-        future_covariates=future_covariates,
-        n_targets=task_target.shape[0],
-        n_covariates=task_past_covariates_array.shape[0],
-        n_future_covariates=len(task_future_covariates_keys),
+        context=task_context_tensor,
+        future_covariates=task_future_covariates_tensor,
+        n_targets=task_n_targets,
+        n_covariates=task_n_covariates,
+        n_future_covariates=task_n_future_covariates,
    )


@ -217,7 +230,6 @@ def prepare_tasks(
    This function handles mode-specific preprocessing (e.g., filtering short series)
    and calls validate_and_prepare_single_dict_task for each task.
    """
-    # Import here to avoid issues with forward reference
    if isinstance(mode, str):
        mode = DatasetMode(mode)

@ -237,13 +249,13 @@ def prepare_tasks(
                raw_task = {**raw_task, "future_covariates": fixed_future_covariates}

        raw_task = cast(dict[str, TensorOrArray | Mapping[str, TensorOrArray]], raw_task)
-        prepared = validate_and_prepare_single_dict_task(raw_task, idx, prediction_length)
+        task = validate_and_prepare_single_dict_task(raw_task, idx, prediction_length)

        # Filter by minimum length (except in TEST mode)
-        if mode != DatasetMode.TEST and prepared["context"].shape[-1] < min_past + prediction_length:
+        if mode != DatasetMode.TEST and task["context"].shape[-1] < min_past + prediction_length:
            continue

-        tasks.append(prepared)
+        tasks.append(task)

    if len(tasks) == 0:
        raise ValueError(
@ -522,15 +534,8 @@ class Chronos2Dataset(IterableDataset):

    def _construct_slice(self, task_idx: int) -> tuple[torch.Tensor, torch.Tensor | None, torch.Tensor, int]:
        task = self.tasks[task_idx]
-        # Convert numpy arrays to torch tensors if needed
-        context = task["context"]
-        future_cov = task["future_covariates"]
-        if isinstance(context, np.ndarray):
-            context = torch.from_numpy(context)
-        if isinstance(future_cov, np.ndarray):
-            future_cov = torch.from_numpy(future_cov)
-        task_past_tensor = context.clone().to(torch.float32)
-        task_future_tensor = future_cov.clone().to(torch.float32)
+        task_past_tensor = task["context"].clone()
+        task_future_tensor = task["future_covariates"].clone()
        task_n_targets = task["n_targets"]
        task_n_covariates = task["n_covariates"]
        task_n_future_covariates = task["n_future_covariates"]