FEAT: Add finetune_depth parameter #471

Merged 24 commits on Oct 15, 2024
Changes from 2 commits
57 changes: 31 additions & 26 deletions nbs/docs/capabilities/forecast/07_finetuning.ipynb
@@ -55,20 +55,7 @@
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [
{
"data": {
"text/markdown": [
"[![](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/Nixtla/nixtla/blob/main/nbs/docs/capabilities/forecast/07_finetuning.ipynb)"
],
"text/plain": [
"<IPython.core.display.Markdown object>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"outputs": [],
"source": [
"#| echo: false\n",
"if not IN_COLAB:\n",
@@ -124,18 +111,7 @@
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"INFO:nixtla.nixtla_client:Validating inputs...\n",
"INFO:nixtla.nixtla_client:Preprocessing dataframes...\n",
"INFO:nixtla.nixtla_client:Inferred freq: MS\n",
"INFO:nixtla.nixtla_client:Calling Forecast Endpoint...\n"
]
}
],
"outputs": [],
"source": [
"# Read data\n",
"df = pd.read_csv(\"https://raw.githubusercontent.com/Nixtla/transfer-learning-time-series/main/datasets/air_passengers.csv\")\n",
@@ -166,6 +142,35 @@
"> By default, `timegpt-1` is used. Please see [this tutorial](https://docs.nixtla.io/docs/tutorials-long_horizon_forecasting) on how and when to use `timegpt-1-long-horizon`."
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"By default, only the last layer of the model is finetuned. We can finetune more layers using `finetune_depth` parameter. "
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"# Read data\n",
"df = pd.read_csv(\"https://raw.githubusercontent.com/Nixtla/transfer-learning-time-series/main/datasets/air_passengers.csv\")\n",
"\n",
"# Forecast with fine-tuning.\n",
"# Here, we fine-tune for 5 steps\n",
"# and we finetune more than just the last layer\n",
"forecast_df = nixtla_client.forecast(\n",
" df=df,\n",
" h=12,\n",
" finetune_steps=5,\n",
" finetune_depth=2,\n",
" time_col='timestamp',\n",
" target_col=\"value\"\n",
")"
]
},
{
"cell_type": "markdown",
"metadata": {},
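Note: the new argument composes with the existing finetune_steps and finetune_loss arguments, all of which appear in the forecast() signature changed by this PR. A minimal sketch with illustrative values (not a recommendation):

import pandas as pd
from nixtla import NixtlaClient

nixtla_client = NixtlaClient(api_key="YOUR_API_KEY")  # placeholder key

# Same dataset as the notebook above
df = pd.read_csv("https://raw.githubusercontent.com/Nixtla/transfer-learning-time-series/main/datasets/air_passengers.csv")

forecast_df = nixtla_client.forecast(
    df=df,
    h=12,
    finetune_steps=10,    # a few more steps than the notebook's 5
    finetune_depth=3,     # deeper than the default (1), shallower than full (5)
    finetune_loss="mae",  # one of: default, mae, mse, rmse, mape, smape
    time_col="timestamp",
    target_col="value",
)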
178 changes: 168 additions & 10 deletions nbs/docs/tutorials/06_finetuning.ipynb

Large diffs are not rendered by default.

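The tutorial diff above is not rendered, so the following is only a hypothetical sketch of how one might compare depths, not the tutorial's actual content. It reuses df and nixtla_client from the previous sketch, and the "TimeGPT" output column name follows the client's documented default:

# Hypothetical: cross-validate each depth on the same data and compare errors.
results = {}
for depth in (1, 2, 3, 4, 5):
    cv_df = nixtla_client.cross_validation(
        df=df,
        h=12,
        n_windows=3,
        finetune_steps=5,
        finetune_depth=depth,
        time_col="timestamp",
        target_col="value",
    )
    # Mean absolute error across all windows and cutoffs.
    results[depth] = (cv_df["value"] - cv_df["TimeGPT"]).abs().mean()

print(results)  # smaller is better; deeper is not always better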
21 changes: 21 additions & 0 deletions nbs/src/nixtla_client.ipynb
@@ -169,6 +169,7 @@
"#| exporti\n",
"_Loss = Literal[\"default\", \"mae\", \"mse\", \"rmse\", \"mape\", \"smape\"]\n",
"_Model = Literal[\"azureai\", \"timegpt-1\", \"timegpt-1-long-horizon\"]\n",
"_Finetune_Depth = Literal[1, 2, 3, 4, 5]\n",
"\n",
"_date_features_by_freq = {\n",
" # Daily frequencies\n",
@@ -913,6 +914,7 @@
" level: Optional[List[Union[int, float]]] = None,\n",
" quantiles: Optional[List[float]] = None,\n",
" finetune_steps: NonNegativeInt = 0,\n",
" finetune_depth: _Finetune_Depth = 1,\n",
" finetune_loss: _Loss = 'default',\n",
" clean_ex_first: bool = True,\n",
" validate_api_key: bool = False,\n",
@@ -964,6 +966,9 @@
" finetune_steps : int (default=0)\n",
" Number of steps used to finetune learning TimeGPT in the\n",
" new data.\n",
" finetune_depth: int (default=1)\n",
" Depth of finetuning, on a scale from 1 to 5. 1 means only the last layer is finetuned\n",
" and 5 means the whole model if finetuned.\n",
" finetune_loss : str (default='default')\n",
" Loss function to use for finetuning. Options are: `default`, `mae`, `mse`, `rmse`, `mape`, and `smape`.\n",
" clean_ex_first : bool (default=True)\n",
@@ -1013,6 +1018,7 @@
" level=level,\n",
" quantiles=quantiles,\n",
" finetune_steps=finetune_steps,\n",
" finetune_depth=finetune_depth,\n",
" finetune_loss=finetune_loss,\n",
" clean_ex_first=clean_ex_first,\n",
" validate_api_key=validate_api_key,\n",
@@ -1099,6 +1105,7 @@
" 'clean_ex_first': clean_ex_first,\n",
" 'level': level,\n",
" 'finetune_steps': finetune_steps,\n",
" 'finetune_depth': finetune_depth,\n",
" 'finetune_loss': finetune_loss,\n",
" 'feature_contributions': feature_contributions and X is not None,\n",
" }\n",
@@ -1331,6 +1338,7 @@
" n_windows: PositiveInt = 1,\n",
" step_size: Optional[PositiveInt] = None,\n",
" finetune_steps: NonNegativeInt = 0,\n",
" finetune_depth: _Finetune_Depth = 1,\n",
" finetune_loss: str = 'default',\n",
" clean_ex_first: bool = True,\n",
" date_features: Union[bool, List[str]] = False,\n",
@@ -1383,6 +1391,9 @@
" finetune_steps : int (default=0)\n",
" Number of steps used to finetune TimeGPT in the\n",
" new data.\n",
" finetune_depth: int (default=1)\n",
" Depth of finetuning, on a scale from 1 to 5. 1 means only the last layer is finetuned\n",
" and 5 means the whole model if finetuned.\n",
" finetune_loss : str (default='default')\n",
" Loss function to use for finetuning. Options are: `default`, `mae`, `mse`, `rmse`, `mape`, and `smape`.\n",
" clean_ex_first : bool (default=True)\n",
@@ -1426,6 +1437,7 @@
" step_size=step_size,\n",
" validate_api_key=validate_api_key,\n",
" finetune_steps=finetune_steps,\n",
" finetune_depth=finetune_depth,\n",
" finetune_loss=finetune_loss,\n",
" clean_ex_first=clean_ex_first,\n",
" date_features=date_features,\n",
@@ -1508,6 +1520,7 @@
" 'clean_ex_first': clean_ex_first,\n",
" 'level': level,\n",
" 'finetune_steps': finetune_steps,\n",
" 'finetune_depth': finetune_depth,\n",
" 'finetune_loss': finetune_loss,\n",
" }\n",
" with httpx.Client(**self._client_kwargs) as client:\n",
@@ -2618,6 +2631,7 @@
" level: Optional[List[Union[int, float]]],\n",
" quantiles: Optional[List[float]],\n",
" finetune_steps: NonNegativeInt,\n",
" finetune_depth: _Finetune_Depth,\n",
" finetune_loss: _Loss,\n",
" clean_ex_first: bool,\n",
" validate_api_key: bool,\n",
@@ -2645,6 +2659,7 @@
" level=level,\n",
" quantiles=quantiles,\n",
" finetune_steps=finetune_steps,\n",
" finetune_depth=finetune_depth,\n",
" finetune_loss=finetune_loss,\n",
" clean_ex_first=clean_ex_first,\n",
" validate_api_key=validate_api_key,\n",
@@ -2700,6 +2715,7 @@
" n_windows: PositiveInt,\n",
" step_size: Optional[PositiveInt],\n",
" finetune_steps: NonNegativeInt,\n",
" finetune_depth: _Finetune_Depth,\n",
" finetune_loss: str,\n",
" clean_ex_first: bool,\n",
" date_features: Union[bool, List[str]],\n",
@@ -2720,6 +2736,7 @@
" n_windows=n_windows,\n",
" step_size=step_size,\n",
" finetune_steps=finetune_steps,\n",
" finetune_depth=finetune_depth,\n",
" finetune_loss=finetune_loss,\n",
" clean_ex_first=clean_ex_first,\n",
" date_features=date_features,\n",
@@ -2806,6 +2823,7 @@
" level: Optional[List[Union[int, float]]],\n",
" quantiles: Optional[List[float]],\n",
" finetune_steps: NonNegativeInt,\n",
" finetune_depth: _Finetune_Depth,\n",
" finetune_loss: _Loss,\n",
" clean_ex_first: bool,\n",
" validate_api_key: bool,\n",
@@ -2861,6 +2879,7 @@
" level=level,\n",
" quantiles=quantiles,\n",
" finetune_steps=finetune_steps,\n",
" finetune_depth=finetune_depth,\n",
" finetune_loss=finetune_loss,\n",
" clean_ex_first=clean_ex_first,\n",
" validate_api_key=validate_api_key,\n",
@@ -2942,6 +2961,7 @@
" n_windows: PositiveInt,\n",
" step_size: Optional[PositiveInt],\n",
" finetune_steps: NonNegativeInt,\n",
" finetune_depth: _Finetune_Depth,\n",
" finetune_loss: _Loss,\n",
" clean_ex_first: bool,\n",
" date_features: Union[bool, List[Union[str, Callable]]],\n",
@@ -2978,6 +2998,7 @@
" n_windows=n_windows,\n",
" step_size=step_size,\n",
" finetune_steps=finetune_steps,\n",
" finetune_depth=finetune_depth,\n",
" finetune_loss=finetune_loss,\n",
" clean_ex_first=clean_ex_first,\n",
" date_features=date_features,\n",
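A note on the _Finetune_Depth = Literal[1, 2, 3, 4, 5] alias added above: Literal narrows the accepted values for static type checkers, but by itself it is not enforced at runtime (whether this client validates it client- or server-side is not shown in this diff). A small, general-Python illustration:

from typing import Literal, get_args

_Finetune_Depth = Literal[1, 2, 3, 4, 5]

def set_depth(depth: _Finetune_Depth) -> None:
    # The annotation documents the valid range and lets type checkers catch misuse.
    print(f"finetune_depth set to {depth}")

set_depth(2)                      # fine
set_depth(6)                      # mypy/pyright flag this; plain Python still runs it
print(get_args(_Finetune_Depth))  # (1, 2, 3, 4, 5)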
21 changes: 21 additions & 0 deletions nixtla/nixtla_client.py
@@ -98,6 +98,7 @@
# %% ../nbs/src/nixtla_client.ipynb 7
_Loss = Literal["default", "mae", "mse", "rmse", "mape", "smape"]
_Model = Literal["azureai", "timegpt-1", "timegpt-1-long-horizon"]
_Finetune_Depth = Literal[1, 2, 3, 4, 5]

_date_features_by_freq = {
# Daily frequencies
@@ -847,6 +848,7 @@ def forecast(
level: Optional[List[Union[int, float]]] = None,
quantiles: Optional[List[float]] = None,
finetune_steps: NonNegativeInt = 0,
finetune_depth: _Finetune_Depth = 1,
finetune_loss: _Loss = "default",
clean_ex_first: bool = True,
validate_api_key: bool = False,
@@ -898,6 +900,9 @@
finetune_steps : int (default=0)
Number of steps used to finetune TimeGPT on the
new data.
finetune_depth : int (default=1)
Depth of finetuning, on a scale from 1 to 5. 1 means only the last layer is finetuned
and 5 means the whole model is finetuned.
finetune_loss : str (default='default')
Loss function to use for finetuning. Options are: `default`, `mae`, `mse`, `rmse`, `mape`, and `smape`.
clean_ex_first : bool (default=True)
@@ -947,6 +952,7 @@
level=level,
quantiles=quantiles,
finetune_steps=finetune_steps,
finetune_depth=finetune_depth,
finetune_loss=finetune_loss,
clean_ex_first=clean_ex_first,
validate_api_key=validate_api_key,
@@ -1035,6 +1041,7 @@
"clean_ex_first": clean_ex_first,
"level": level,
"finetune_steps": finetune_steps,
"finetune_depth": finetune_depth,
"finetune_loss": finetune_loss,
"feature_contributions": feature_contributions and X is not None,
}
@@ -1283,6 +1290,7 @@ def cross_validation(
n_windows: PositiveInt = 1,
step_size: Optional[PositiveInt] = None,
finetune_steps: NonNegativeInt = 0,
finetune_depth: _Finetune_Depth = 1,
finetune_loss: str = "default",
clean_ex_first: bool = True,
date_features: Union[bool, List[str]] = False,
@@ -1335,6 +1343,9 @@
finetune_steps : int (default=0)
Number of steps used to finetune TimeGPT on the
new data.
finetune_depth : int (default=1)
Depth of finetuning, on a scale from 1 to 5. 1 means only the last layer is finetuned
and 5 means the whole model is finetuned.
finetune_loss : str (default='default')
Loss function to use for finetuning. Options are: `default`, `mae`, `mse`, `rmse`, `mape`, and `smape`.
clean_ex_first : bool (default=True)
@@ -1378,6 +1389,7 @@
step_size=step_size,
validate_api_key=validate_api_key,
finetune_steps=finetune_steps,
finetune_depth=finetune_depth,
finetune_loss=finetune_loss,
clean_ex_first=clean_ex_first,
date_features=date_features,
@@ -1460,6 +1472,7 @@
"clean_ex_first": clean_ex_first,
"level": level,
"finetune_steps": finetune_steps,
"finetune_depth": finetune_depth,
"finetune_loss": finetune_loss,
}
with httpx.Client(**self._client_kwargs) as client:
@@ -1618,6 +1631,7 @@ def _forecast_wrapper(
level: Optional[List[Union[int, float]]],
quantiles: Optional[List[float]],
finetune_steps: NonNegativeInt,
finetune_depth: _Finetune_Depth,
finetune_loss: _Loss,
clean_ex_first: bool,
validate_api_key: bool,
@@ -1645,6 +1659,7 @@
level=level,
quantiles=quantiles,
finetune_steps=finetune_steps,
finetune_depth=finetune_depth,
finetune_loss=finetune_loss,
clean_ex_first=clean_ex_first,
validate_api_key=validate_api_key,
@@ -1702,6 +1717,7 @@ def _cross_validation_wrapper(
n_windows: PositiveInt,
step_size: Optional[PositiveInt],
finetune_steps: NonNegativeInt,
finetune_depth: _Finetune_Depth,
finetune_loss: str,
clean_ex_first: bool,
date_features: Union[bool, List[str]],
@@ -1722,6 +1738,7 @@
n_windows=n_windows,
step_size=step_size,
finetune_steps=finetune_steps,
finetune_depth=finetune_depth,
finetune_loss=finetune_loss,
clean_ex_first=clean_ex_first,
date_features=date_features,
@@ -1811,6 +1828,7 @@ def _distributed_forecast(
level: Optional[List[Union[int, float]]],
quantiles: Optional[List[float]],
finetune_steps: NonNegativeInt,
finetune_depth: _Finetune_Depth,
finetune_loss: _Loss,
clean_ex_first: bool,
validate_api_key: bool,
@@ -1867,6 +1885,7 @@ def format_X_df(
level=level,
quantiles=quantiles,
finetune_steps=finetune_steps,
finetune_depth=finetune_depth,
finetune_loss=finetune_loss,
clean_ex_first=clean_ex_first,
validate_api_key=validate_api_key,
@@ -1950,6 +1969,7 @@ def _distributed_cross_validation(
n_windows: PositiveInt,
step_size: Optional[PositiveInt],
finetune_steps: NonNegativeInt,
finetune_depth: _Finetune_Depth,
finetune_loss: _Loss,
clean_ex_first: bool,
date_features: Union[bool, List[Union[str, Callable]]],
@@ -1986,6 +2006,7 @@
n_windows=n_windows,
step_size=step_size,
finetune_steps=finetune_steps,
finetune_depth=finetune_depth,
finetune_loss=finetune_loss,
clean_ex_first=clean_ex_first,
date_features=date_features,
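Since finetune_depth is threaded through _forecast_wrapper, _cross_validation_wrapper, and the _distributed_* variants above, the argument should also reach distributed dataframes. A hypothetical sketch, assuming a Spark session and a parquet path that are not part of this PR:

from pyspark.sql import SparkSession

spark = SparkSession.builder.getOrCreate()
spark_df = spark.read.parquet("data/air_passengers.parquet")  # hypothetical path

fcst_df = nixtla_client.forecast(
    df=spark_df,  # distributed input is routed through _distributed_forecast
    h=12,
    finetune_steps=5,
    finetune_depth=2,
    time_col="timestamp",
    target_col="value",
)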