Upload 8 files

Browse files

Files changed (8) hide show

README.md +70 -0
config.json +250 -0
model.py +254 -0
model_all.safetensors +3 -0
model_carbs.safetensors +3 -0
model_cgm.safetensors +3 -0
model_insulin.safetensors +3 -0
push.sh +18 -0

README.md ADDED Viewed

	@@ -0,0 +1,70 @@

+---
+license: apache-2.0
+tags:
+  - cgm
+  - time-series
+  - glucose-forecasting
+  - ridge-regression
+  - metabonet
+library_name: transformers
+pipeline_tag: time-series-forecasting
+---
+# Ridge multi-horizon CGM forecaster (MetaboNet)
+A `sklearn`-trained Ridge regressor (with `StandardScaler`) re-packaged as a
+`transformers`-compatible Hub model. One repo holds four feature ablations
+selectable at load time:
+- `cgm` — 24 CGM lags + `hour_sin`/`hour_cos` (26 features).
+- `insulin` — `cgm` features + 24 Insulin lags (50 features).
+- `carbs` — `cgm` features + 24 Carbs lags (50 features).
+- `all` — `cgm` features + 24 Insulin lags + 24 Carbs lags (74 features).
+History length is 24 (= 2 hours at 5-minute sampling). Output is 12 future
+CGM values (5–60 min horizons).
+## Files
+- `config.json` — `auto_map` wiring + per-ablation feature lists.
+- `model.py` — `RidgeMultiHorizonConfig` / `RidgeMultiHorizonModel`
+  (`trust_remote_code=True`).
+- `model_<ablation>.safetensors` — one per ablation, holding `scaler_mean`,
+  `scaler_scale`, `coef` (12 × F), `intercept` (12).
+## Usage
+```python
+from transformers import AutoConfig, AutoModel
+cfg = AutoConfig.from_pretrained(
+    "anonymous-4FAD/Ridge", trust_remote_code=True, ablation="cgm"
+)
+model = AutoModel.from_pretrained(
+    "anonymous-4FAD/Ridge", trust_remote_code=True, config=cfg
+)
+# Inputs match the MetaboNet benchmark.py contract:
+#   timestamps: int64 ns, shape (B, T_in)
+#   cgm/insulin/carbs: float, shape (B, T_in); only the last 24 steps are used
+preds = model.predict(timestamps, cgm, insulin, carbs)  # -> (B, 12)
+```
+The thin local wrapper in
+[`models/ridge.py`](https://github.com/njeffrie/MetaboNet-Bench/blob/main/models/ridge.py)
+exposes the same API used by `benchmark.py`.
+## Feature convention
+`CGM_t<i>` denotes the i-th sample within the last `history_length` steps,
+ordered oldest -> newest (`CGM_t0` is the oldest of the 24, `CGM_t23` is the
+newest). The same convention applies to `Insulin_t<i>` and `Carbs_t<i>`.
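+`hour_sin` / `hour_cos` encode the UTC hour-of-day (truncated to the whole
+hour) of the most recent input timestamp. In every ablation the lag columns
+come first (CGM, then Insulin, then Carbs) and `hour_sin` / `hour_cos` are the
+last two columns, matching `feature_names_by_ablation` in `config.json`.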
+## Provenance
+Trained via
+[`other_models/results/train_ridge.py`](https://github.com/njeffrie/MetaboNet-Bench/blob/main/other_models/results/train_ridge.py)
+on the public MetaboNet train split. The `safetensors` checkpoints are produced
+by [`scripts/build_other_models_hub.py`](https://github.com/njeffrie/MetaboNet-Bench/blob/main/scripts/build_other_models_hub.py)
+from the original sklearn pickles.

config.json ADDED Viewed

	@@ -0,0 +1,250 @@

+{
+  "model_type": "ridge_multihorizon",
+  "auto_map": {
+    "AutoConfig": "model.RidgeMultiHorizonConfig",
+    "AutoModel": "model.RidgeMultiHorizonModel"
+  },
+  "architectures": [
+    "RidgeMultiHorizonModel"
+  ],
+  "ablation": "all",
+  "ablations": [
+    "cgm",
+    "insulin",
+    "carbs",
+    "all"
+  ],
+  "history_length": 24,
+  "horizon_length": 12,
+  "feature_names_by_ablation": {
+    "cgm": [
+      "CGM_t0",
+      "CGM_t1",
+      "CGM_t2",
+      "CGM_t3",
+      "CGM_t4",
+      "CGM_t5",
+      "CGM_t6",
+      "CGM_t7",
+      "CGM_t8",
+      "CGM_t9",
+      "CGM_t10",
+      "CGM_t11",
+      "CGM_t12",
+      "CGM_t13",
+      "CGM_t14",
+      "CGM_t15",
+      "CGM_t16",
+      "CGM_t17",
+      "CGM_t18",
+      "CGM_t19",
+      "CGM_t20",
+      "CGM_t21",
+      "CGM_t22",
+      "CGM_t23",
+      "hour_sin",
+      "hour_cos"
+    ],
+    "insulin": [
+      "CGM_t0",
+      "CGM_t1",
+      "CGM_t2",
+      "CGM_t3",
+      "CGM_t4",
+      "CGM_t5",
+      "CGM_t6",
+      "CGM_t7",
+      "CGM_t8",
+      "CGM_t9",
+      "CGM_t10",
+      "CGM_t11",
+      "CGM_t12",
+      "CGM_t13",
+      "CGM_t14",
+      "CGM_t15",
+      "CGM_t16",
+      "CGM_t17",
+      "CGM_t18",
+      "CGM_t19",
+      "CGM_t20",
+      "CGM_t21",
+      "CGM_t22",
+      "CGM_t23",
+      "Insulin_t0",
+      "Insulin_t1",
+      "Insulin_t2",
+      "Insulin_t3",
+      "Insulin_t4",
+      "Insulin_t5",
+      "Insulin_t6",
+      "Insulin_t7",
+      "Insulin_t8",
+      "Insulin_t9",
+      "Insulin_t10",
+      "Insulin_t11",
+      "Insulin_t12",
+      "Insulin_t13",
+      "Insulin_t14",
+      "Insulin_t15",
+      "Insulin_t16",
+      "Insulin_t17",
+      "Insulin_t18",
+      "Insulin_t19",
+      "Insulin_t20",
+      "Insulin_t21",
+      "Insulin_t22",
+      "Insulin_t23",
+      "hour_sin",
+      "hour_cos"
+    ],
+    "carbs": [
+      "CGM_t0",
+      "CGM_t1",
+      "CGM_t2",
+      "CGM_t3",
+      "CGM_t4",
+      "CGM_t5",
+      "CGM_t6",
+      "CGM_t7",
+      "CGM_t8",
+      "CGM_t9",
+      "CGM_t10",
+      "CGM_t11",
+      "CGM_t12",
+      "CGM_t13",
+      "CGM_t14",
+      "CGM_t15",
+      "CGM_t16",
+      "CGM_t17",
+      "CGM_t18",
+      "CGM_t19",
+      "CGM_t20",
+      "CGM_t21",
+      "CGM_t22",
+      "CGM_t23",
+      "Carbs_t0",
+      "Carbs_t1",
+      "Carbs_t2",
+      "Carbs_t3",
+      "Carbs_t4",
+      "Carbs_t5",
+      "Carbs_t6",
+      "Carbs_t7",
+      "Carbs_t8",
+      "Carbs_t9",
+      "Carbs_t10",
+      "Carbs_t11",
+      "Carbs_t12",
+      "Carbs_t13",
+      "Carbs_t14",
+      "Carbs_t15",
+      "Carbs_t16",
+      "Carbs_t17",
+      "Carbs_t18",
+      "Carbs_t19",
+      "Carbs_t20",
+      "Carbs_t21",
+      "Carbs_t22",
+      "Carbs_t23",
+      "hour_sin",
+      "hour_cos"
+    ],
+    "all": [
+      "CGM_t0",
+      "CGM_t1",
+      "CGM_t2",
+      "CGM_t3",
+      "CGM_t4",
+      "CGM_t5",
+      "CGM_t6",
+      "CGM_t7",
+      "CGM_t8",
+      "CGM_t9",
+      "CGM_t10",
+      "CGM_t11",
+      "CGM_t12",
+      "CGM_t13",
+      "CGM_t14",
+      "CGM_t15",
+      "CGM_t16",
+      "CGM_t17",
+      "CGM_t18",
+      "CGM_t19",
+      "CGM_t20",
+      "CGM_t21",
+      "CGM_t22",
+      "CGM_t23",
+      "Insulin_t0",
+      "Insulin_t1",
+      "Insulin_t2",
+      "Insulin_t3",
+      "Insulin_t4",
+      "Insulin_t5",
+      "Insulin_t6",
+      "Insulin_t7",
+      "Insulin_t8",
+      "Insulin_t9",
+      "Insulin_t10",
+      "Insulin_t11",
+      "Insulin_t12",
+      "Insulin_t13",
+      "Insulin_t14",
+      "Insulin_t15",
+      "Insulin_t16",
+      "Insulin_t17",
+      "Insulin_t18",
+      "Insulin_t19",
+      "Insulin_t20",
+      "Insulin_t21",
+      "Insulin_t22",
+      "Insulin_t23",
+      "Carbs_t0",
+      "Carbs_t1",
+      "Carbs_t2",
+      "Carbs_t3",
+      "Carbs_t4",
+      "Carbs_t5",
+      "Carbs_t6",
+      "Carbs_t7",
+      "Carbs_t8",
+      "Carbs_t9",
+      "Carbs_t10",
+      "Carbs_t11",
+      "Carbs_t12",
+      "Carbs_t13",
+      "Carbs_t14",
+      "Carbs_t15",
+      "Carbs_t16",
+      "Carbs_t17",
+      "Carbs_t18",
+      "Carbs_t19",
+      "Carbs_t20",
+      "Carbs_t21",
+      "Carbs_t22",
+      "Carbs_t23",
+      "hour_sin",
+      "hour_cos"
+    ]
+  },
+  "n_features_by_ablation": {
+    "cgm": 26,
+    "insulin": 50,
+    "carbs": 50,
+    "all": 74
+  },
+  "target_names": [
+    "CGM_t+1",
+    "CGM_t+2",
+    "CGM_t+3",
+    "CGM_t+4",
+    "CGM_t+5",
+    "CGM_t+6",
+    "CGM_t+7",
+    "CGM_t+8",
+    "CGM_t+9",
+    "CGM_t+10",
+    "CGM_t+11",
+    "CGM_t+12"
+  ],
+  "transformers_version": "4.54.0"
+}

model.py ADDED Viewed

	@@ -0,0 +1,254 @@

+"""Ridge multi-horizon CGM forecaster, packaged for the HF Hub.
+One repo holds four feature ablations (``cgm``, ``insulin``, ``carbs``, ``all``)
+as separate ``model_<ablation>.safetensors`` files. The active ablation is
+selected at load time via the ``ablation=`` kwarg passed through ``AutoConfig``
+or ``AutoModel`` ``from_pretrained``.
+Usage::
+    from transformers import AutoConfig, AutoModel
+    cfg = AutoConfig.from_pretrained(
+        "anonymous-4FAD/Ridge", trust_remote_code=True, ablation="cgm")
+    model = AutoModel.from_pretrained(
+        "anonymous-4FAD/Ridge", trust_remote_code=True, config=cfg)
+    preds = model.predict(timestamps_ns, cgm, insulin, carbs)  # (B, 12)
+"""
+from __future__ import annotations
+import math
+import os
+from typing import Optional
+import numpy as np
+import torch
+import torch.nn as nn
+from huggingface_hub import hf_hub_download
+from safetensors.torch import load_file
+from transformers import PretrainedConfig, PreTrainedModel
+_HUB_DOWNLOAD_KWARGS = (
+    "cache_dir",
+    "force_download",
+    "local_files_only",
+    "proxies",
+    "revision",
+    "subfolder",
+    "token",
+)
+class RidgeMultiHorizonConfig(PretrainedConfig):
+    """Config for the multi-horizon Ridge forecaster.
+    The same repo serves four ablations (``cgm``, ``insulin``, ``carbs``,
+    ``all``); the currently active one is ``self.ablation``.
+    """
+    model_type = "ridge_multihorizon"
+    def __init__(
+        self,
+        ablation: str = "all",
+        ablations: Optional[list] = None,
+        history_length: int = 24,
+        horizon_length: int = 12,
+        feature_names_by_ablation: Optional[dict] = None,
+        n_features_by_ablation: Optional[dict] = None,
+        target_names: Optional[list] = None,
+        **kwargs,
+    ):
+        if ablations is None:
+            ablations = ["cgm", "insulin", "carbs", "all"]
+        if ablation not in ablations:
+            raise ValueError(
+                f"ablation must be one of {ablations}, got {ablation!r}"
+            )
+        self.ablation = ablation
+        self.ablations = list(ablations)
+        self.history_length = int(history_length)
+        self.horizon_length = int(horizon_length)
+        self.feature_names_by_ablation = feature_names_by_ablation or {}
+        self.n_features_by_ablation = n_features_by_ablation or {}
+        self.target_names = list(target_names or [])
+        super().__init__(**kwargs)
+    @property
+    def n_features(self) -> int:
+        if self.n_features_by_ablation:
+            return int(self.n_features_by_ablation[self.ablation])
+        return len(self.feature_names_by_ablation[self.ablation])
+    @property
+    def feature_names(self) -> list:
+        return list(self.feature_names_by_ablation[self.ablation])
+class RidgeMultiHorizonModel(PreTrainedModel):
+    """Multi-output Ridge regressor over standardized tabular features.
+    Holds only buffers (``scaler_mean``, ``scaler_scale``, ``coef``,
+    ``intercept``); there are no trainable parameters.
+    """
+    config_class = RidgeMultiHorizonConfig
+    main_input_name = "features"
+    _tied_weights_keys: dict = None
+    _no_split_modules: list = []
+    def __init__(self, config: RidgeMultiHorizonConfig):
+        super().__init__(config)
+        n_feat = config.n_features
+        n_horiz = config.horizon_length
+        self.register_buffer("scaler_mean", torch.zeros(n_feat))
+        self.register_buffer("scaler_scale", torch.ones(n_feat))
+        self.register_buffer("coef", torch.zeros(n_horiz, n_feat))
+        self.register_buffer("intercept", torch.zeros(n_horiz))
+    def _init_weights(self, module):
+        # No trainable parameters; values come from safetensors.
+        pass
+    def forward(self, features: torch.Tensor) -> torch.Tensor:
+        x = (features.to(self.coef.dtype) - self.scaler_mean) / self.scaler_scale
+        return x @ self.coef.T + self.intercept
+    @classmethod
+    def from_pretrained(
+        cls,
+        pretrained_model_name_or_path,
+        *model_args,
+        config=None,
+        ablation: Optional[str] = None,
+        **kwargs,
+    ):
+        # Drop transformers-internal markers we don't need to act on.
+        kwargs.pop("trust_remote_code", None)
+        kwargs.pop("_from_auto", None)
+        kwargs.pop("_commit_hash", None)
+        hub_kwargs = {k: kwargs.pop(k) for k in _HUB_DOWNLOAD_KWARGS if k in kwargs}
+        if config is None:
+            config_kwargs = dict(hub_kwargs)
+            if ablation is not None:
+                config_kwargs["ablation"] = ablation
+            config = RidgeMultiHorizonConfig.from_pretrained(
+                pretrained_model_name_or_path, **config_kwargs
+            )
+        elif ablation is not None:
+            config.ablation = ablation
+        model = cls(config)
+        weights_filename = f"model_{config.ablation}.safetensors"
+        if os.path.isdir(str(pretrained_model_name_or_path)):
+            weights_path = os.path.join(
+                str(pretrained_model_name_or_path), weights_filename)
+            if not os.path.isfile(weights_path):
+                raise FileNotFoundError(
+                    f"Expected {weights_filename} in {pretrained_model_name_or_path}"
+                )
+        else:
+            weights_path = hf_hub_download(
+                repo_id=str(pretrained_model_name_or_path),
+                filename=weights_filename,
+                **hub_kwargs,
+            )
+        state = load_file(weights_path)
+        missing, unexpected = model.load_state_dict(state, strict=False)
+        if missing:
+            raise RuntimeError(
+                f"{weights_filename} is missing buffers required by the model: {missing}"
+            )
+        if unexpected:
+            # Not fatal, but worth surfacing in case a checkpoint has stale keys.
+            print(
+                f"RidgeMultiHorizonModel: ignoring unexpected keys in "
+                f"{weights_filename}: {unexpected}"
+            )
+        model.eval()
+        return model
+    @torch.no_grad()
+    def predict(self, timestamps, cgm, insulin, carbs) -> np.ndarray:
+        """Run inference for a benchmark.py-style batch.
+        Args:
+            timestamps: int64 ns timestamps, shape ``(B, T_in)``.
+            cgm: float CGM values, shape ``(B, T_in)``.
+            insulin: float insulin values, shape ``(B, T_in)`` (used only if
+                the active ablation requires Insulin features).
+            carbs: float carb values, shape ``(B, T_in)`` (used only if the
+                active ablation requires Carbs features).
+        Returns:
+            ``(B, horizon_length)`` numpy array of predicted CGM values.
+        """
+        features = _build_tabular_features(
+            timestamps=np.asarray(timestamps),
+            cgm=np.asarray(cgm, dtype=np.float64),
+            insulin=np.asarray(insulin, dtype=np.float64),
+            carbs=np.asarray(carbs, dtype=np.float64),
+            feature_names=self.config.feature_names,
+            history_length=self.config.history_length,
+        )
+        device = self.coef.device
+        x = torch.as_tensor(features, dtype=self.coef.dtype, device=device)
+        out = self.forward(x)
+        return out.detach().cpu().numpy()
+def _build_tabular_features(
+    *,
+    timestamps: np.ndarray,
+    cgm: np.ndarray,
+    insulin: np.ndarray,
+    carbs: np.ndarray,
+    feature_names: list,
+    history_length: int,
+) -> np.ndarray:
+    """Assemble a (B, F) feature matrix in the order given by ``feature_names``.
+    Convention: ``CGM_t<i>`` means the i-th *most recent* sample within the
+    last ``history_length`` steps, i.e. ``CGM_t0`` = oldest in the window,
+    ``CGM_t<history_length-1>`` = newest. Same convention applies to
+    ``Insulin_t<i>`` / ``Carbs_t<i>``. ``hour_sin`` / ``hour_cos`` are derived
+    from the most recent input timestamp (UTC hour-of-day).
+    """
+    if cgm.shape[-1] < history_length:
+        raise ValueError(
+            f"Need at least {history_length} CGM samples, got {cgm.shape[-1]}"
+        )
+    cgm_h = cgm[..., -history_length:]
+    insulin_h = insulin[..., -history_length:]
+    carbs_h = carbs[..., -history_length:]
+    # Hour-of-day from the most recent input timestamp (ns since epoch).
+    last_ts = np.asarray(timestamps)[..., -1].astype(np.int64)
+    hours = (last_ts // 3_600_000_000_000) % 24
+    hour_sin = np.sin(2.0 * math.pi * hours / 24.0)
+    hour_cos = np.cos(2.0 * math.pi * hours / 24.0)
+    columns = []
+    for name in feature_names:
+        if name.startswith("CGM_t"):
+            i = int(name.split("_t", 1)[1])
+            columns.append(cgm_h[..., i])
+        elif name.startswith("Insulin_t"):
+            i = int(name.split("_t", 1)[1])
+            columns.append(insulin_h[..., i])
+        elif name.startswith("Carbs_t"):
+            i = int(name.split("_t", 1)[1])
+            columns.append(carbs_h[..., i])
+        elif name == "hour_sin":
+            columns.append(hour_sin)
+        elif name == "hour_cos":
+            columns.append(hour_cos)
+        else:
+            raise ValueError(f"Unknown feature column: {name!r}")
+    return np.stack(columns, axis=-1).astype(np.float32)

model_all.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb1cc1ecc7a8d58993966a9e4f6b44e80ec48b6b130a3370865ccd9120af4903
+size 4480

model_carbs.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7f2aa37a10c6548161e19f3cf3ec890f32f302a8144b9255485eacde03c01fb8
+size 3136

model_cgm.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a2a839117a4ad2b23b19d2d3a2cb2b676ac01a2fa42804a72e5ca629c64812f3
+size 1792

model_insulin.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:73669bf02fe503007004f75bcc7ff94c84ebebb6472ec6163e32fa4e51579d52
+size 3136

push.sh ADDED Viewed

	@@ -0,0 +1,18 @@

+#!/usr/bin/env bash
+# Upload hub/ridge to the Hugging Face Hub.
+# Run from anywhere; the script resolves its own location.
+#
+# Override the destination repo via the REPO env var (default:
+# anonymous-4FAD/Ridge). Extra args are forwarded to ``huggingface-cli upload``.
+#
+# Requires:
+#   - huggingface-cli installed (it ships with huggingface_hub).
+#   - You are logged in: ``huggingface-cli login``.
+set -euo pipefail
+HERE="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
+REPO="${REPO:-anonymous-4FAD/Ridge}"
+echo "Uploading ${HERE} -> ${REPO}"
+huggingface-cli upload "$REPO" "$HERE" . --repo-type model "$@"