From b9ea2e73da13ba9f19ca8d6f608c91b679044323 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Morales?= <jmoralz92@gmail.com>
Date: Tue, 22 Oct 2024 15:59:10 -0600
Subject: [PATCH 1/6] fix(ci): increase tolerance in distributed tests

---
 nbs/src/nixtla_client.ipynb | 120 +++++++++---------------------------
 nixtla/nixtla_client.py     |   2 +-
 2 files changed, 29 insertions(+), 93 deletions(-)

diff --git a/nbs/src/nixtla_client.ipynb b/nbs/src/nixtla_client.ipynb
index f15664ea..7e524d1c 100644
--- a/nbs/src/nixtla_client.ipynb
+++ b/nbs/src/nixtla_client.ipynb
@@ -1734,31 +1734,6 @@
     "nixtla_client.validate_api_key()"
    ]
   },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "#| hide\n",
-    "_nixtla_client = NixtlaClient(api_key=\"invalid\")\n",
-    "test_eq(_nixtla_client.validate_api_key(), False)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "#| hide\n",
-    "_nixtla_client = NixtlaClient(\n",
-    "    api_key=os.environ['NIXTLA_API_KEY_CUSTOM'], \n",
-    "    base_url=os.environ['NIXTLA_BASE_URL_CUSTOM'],\n",
-    ")\n",
-    "_nixtla_client.validate_api_key()"
-   ]
-  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -2089,49 +2064,15 @@
    "outputs": [],
    "source": [
     "#| hide\n",
-    "#test same results custom url\n",
-    "nixtla_client_custom = NixtlaClient(\n",
-    "    api_key=os.environ['NIXTLA_API_KEY_CUSTOM'], \n",
-    "    base_url=os.environ['NIXTLA_BASE_URL_CUSTOM'],\n",
-    ")\n",
-    "# forecast method\n",
+    "# test different results for different models\n",
     "fcst_kwargs = dict(\n",
-    "    df=df, \n",
-    "    h=12, \n",
-    "    level=[90, 95], \n",
-    "    add_history=True, \n",
-    "    time_col='timestamp', \n",
+    "    df=df,\n",
+    "    h=12,\n",
+    "    level=[90, 95],\n",
+    "    add_history=True,\n",
+    "    time_col='timestamp',\n",
     "    target_col='value',\n",
     ")\n",
-    "fcst_df = nixtla_client.forecast(**fcst_kwargs)\n",
-    "fcst_df_custom = nixtla_client_custom.forecast(**fcst_kwargs)\n",
-    "pd.testing.assert_frame_equal(\n",
-    "    fcst_df,\n",
-    "    fcst_df_custom,\n",
-    ")\n",
-    "# anomalies method\n",
-    "anomalies_kwargs = dict(\n",
-    "    df=df, \n",
-    "    level=99,\n",
-    "    time_col='timestamp', \n",
-    "    target_col='value',\n",
-    ")\n",
-    "anomalies_df = nixtla_client.detect_anomalies(**anomalies_kwargs)\n",
-    "anomalies_df_custom = nixtla_client_custom.detect_anomalies(**anomalies_kwargs)\n",
-    "pd.testing.assert_frame_equal(\n",
-    "    anomalies_df,\n",
-    "    anomalies_df_custom,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "#| hide\n",
-    "# test different results for different models\n",
     "fcst_kwargs['model'] = 'timegpt-1'\n",
     "fcst_timegpt_1 = nixtla_client.forecast(**fcst_kwargs)\n",
     "fcst_kwargs['model'] = 'timegpt-1-long-horizon'\n",
@@ -2152,10 +2093,10 @@
     "# test different results for different models\n",
     "# cross validation\n",
     "cv_kwargs = dict(\n",
-    "    df=df, \n",
-    "    h=12, \n",
-    "    level=[90, 95], \n",
-    "    time_col='timestamp', \n",
+    "    df=df,\n",
+    "    h=12,\n",
+    "    level=[90, 95],\n",
+    "    time_col='timestamp',\n",
     "    target_col='value',\n",
     ")\n",
     "cv_kwargs['model'] = 'timegpt-1'\n",
@@ -2177,6 +2118,12 @@
     "#| hide\n",
     "# test different results for different models\n",
     "# anomalies\n",
+    "anomalies_kwargs = dict(\n",
+    "    df=df,\n",
+    "    level=99,\n",
+    "    time_col='timestamp',\n",
+    "    target_col='value',\n",
+    ")\n",
     "anomalies_kwargs['model'] = 'timegpt-1'\n",
     "anomalies_timegpt_1 = nixtla_client.detect_anomalies(**anomalies_kwargs)\n",
     "anomalies_kwargs['model'] = 'timegpt-1-long-horizon'\n",
@@ -2572,23 +2519,6 @@
     ")"
    ]
   },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "#| hide\n",
-    "# test custom url\n",
-    "# same results\n",
-    "_timegpt_fcst_df = _nixtla_client.forecast(df=df, h=12, time_col='timestamp', target_col='value')\n",
-    "timegpt_fcst_df = nixtla_client.forecast(df=df, h=12, time_col='timestamp', target_col='value')\n",
-    "pd.testing.assert_frame_equal(\n",
-    "    _timegpt_fcst_df,\n",
-    "    timegpt_fcst_df,\n",
-    ")"
-   ]
-  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -3060,6 +2990,8 @@
    "source": [
     "#| hide\n",
     "#| distributed\n",
+    "ATOL = 1e-3\n",
+    "\n",
     "def test_forecast(\n",
     "    df: fugue.AnyDataFrame, \n",
     "    horizon: int = 12,\n",
@@ -3147,6 +3079,7 @@
     "    pd.testing.assert_frame_equal(\n",
     "        fcst_df.sort_values([id_col, time_col]).reset_index(drop=True),\n",
     "        fcst_df_2.sort_values([id_col, time_col]).reset_index(drop=True),\n",
+    "        atol=ATOL,\n",
     "    )\n",
     "\n",
     "def test_cv_same_results_num_partitions(\n",
@@ -3177,6 +3110,7 @@
     "    pd.testing.assert_frame_equal(\n",
     "        fcst_df.sort_values([id_col, time_col]).reset_index(drop=True),\n",
     "        fcst_df_2.sort_values([id_col, time_col]).reset_index(drop=True),\n",
+    "        atol=ATOL,\n",
     "    )\n",
     "\n",
     "def test_forecast_dataframe(df: fugue.AnyDataFrame):\n",
@@ -3241,7 +3175,8 @@
     "    fcst_df_2 = fa.as_pandas(fcst_df_2)\n",
     "    equal_arrays = np.array_equal(\n",
     "        fcst_df.sort_values([id_col, time_col])['TimeGPT'].values,\n",
-    "        fcst_df_2.sort_values([id_col, time_col])['TimeGPT'].values\n",
+    "        fcst_df_2.sort_values([id_col, time_col])['TimeGPT'].values,\n",
+    "        #atol=ATOL,\n",
     "    )\n",
     "    assert not equal_arrays, 'Forecasts with and without ex vars are equal'\n",
     "\n",
@@ -3277,7 +3212,8 @@
     "    fcst_df_2 = fa.as_pandas(fcst_df_2)\n",
     "    equal_arrays = np.array_equal(\n",
     "        fcst_df.sort_values([id_col, time_col])['TimeGPT'].values,\n",
-    "        fcst_df_2.sort_values([id_col, time_col])['TimeGPT'].values\n",
+    "        fcst_df_2.sort_values([id_col, time_col])['TimeGPT'].values,\n",
+    "        #atol=ATOL,\n",
     "    )\n",
     "    assert not equal_arrays, 'Forecasts with and without ex vars are equal'\n",
     "\n",
@@ -3360,7 +3296,7 @@
     "    pd.testing.assert_frame_equal(\n",
     "        anomalies_df.sort_values([id_col, time_col]).reset_index(drop=True),\n",
     "        anomalies_df_2.sort_values([id_col, time_col]).reset_index(drop=True),\n",
-    "        atol=1e-5,\n",
+    "        atol=ATOL,\n",
     "    )\n",
     "\n",
     "def test_anomalies_diff_results_diff_models(\n",
@@ -3420,10 +3356,10 @@
     "    exp_q_cols = [f\"TimeGPT-q-{int(q * 100)}\" for q in test_qls]\n",
     "    def test_method_qls(method, **kwargs):\n",
     "        df_qls = method(\n",
-    "            df=df, \n",
-    "            h=12, \n",
+    "            df=df,\n",
+    "            h=12,\n",
     "            id_col=id_col,\n",
-    "            time_col=time_col, \n",
+    "            time_col=time_col,\n",
     "            quantiles=test_qls,\n",
     "            **kwargs\n",
     "        )\n",
diff --git a/nixtla/nixtla_client.py b/nixtla/nixtla_client.py
index 99ced843..2d11c4da 100644
--- a/nixtla/nixtla_client.py
+++ b/nixtla/nixtla_client.py
@@ -1628,7 +1628,7 @@ def plot(
             ax=ax,
         )
 
-# %% ../nbs/src/nixtla_client.ipynb 54
+# %% ../nbs/src/nixtla_client.ipynb 50
 def _forecast_wrapper(
     df: pd.DataFrame,
     client: NixtlaClient,

From f5019722c005666804293dab876c85e782d5f553 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Morales?= <jmoralz92@gmail.com>
Date: Tue, 22 Oct 2024 16:02:49 -0600
Subject: [PATCH 2/6] remove comments

---
 nbs/src/nixtla_client.ipynb | 2 --
 1 file changed, 2 deletions(-)

diff --git a/nbs/src/nixtla_client.ipynb b/nbs/src/nixtla_client.ipynb
index 7e524d1c..17b1f756 100644
--- a/nbs/src/nixtla_client.ipynb
+++ b/nbs/src/nixtla_client.ipynb
@@ -3176,7 +3176,6 @@
     "    equal_arrays = np.array_equal(\n",
     "        fcst_df.sort_values([id_col, time_col])['TimeGPT'].values,\n",
     "        fcst_df_2.sort_values([id_col, time_col])['TimeGPT'].values,\n",
-    "        #atol=ATOL,\n",
     "    )\n",
     "    assert not equal_arrays, 'Forecasts with and without ex vars are equal'\n",
     "\n",
@@ -3213,7 +3212,6 @@
     "    equal_arrays = np.array_equal(\n",
     "        fcst_df.sort_values([id_col, time_col])['TimeGPT'].values,\n",
     "        fcst_df_2.sort_values([id_col, time_col])['TimeGPT'].values,\n",
-    "        #atol=ATOL,\n",
     "    )\n",
     "    assert not equal_arrays, 'Forecasts with and without ex vars are equal'\n",
     "\n",

From 17d69b3d1fa3f3593b9b0bc28b6f1afc5a8945e2 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Morales?= <jmoralz92@gmail.com>
Date: Tue, 22 Oct 2024 16:15:57 -0600
Subject: [PATCH 3/6] set tol in historic test

---
 nbs/src/nixtla_client.ipynb | 1 +
 1 file changed, 1 insertion(+)

diff --git a/nbs/src/nixtla_client.ipynb b/nbs/src/nixtla_client.ipynb
index 17b1f756..b5857d46 100644
--- a/nbs/src/nixtla_client.ipynb
+++ b/nbs/src/nixtla_client.ipynb
@@ -2031,6 +2031,7 @@
     "    pd.testing.assert_frame_equal(\n",
     "        fcst_no_rest_df,\n",
     "        fcst_rest_df,\n",
+    "        atol=1e-4,\n",
     "    )\n",
     "    return fcst_rest_df\n",
     "\n",

From 0df77d7945a787165f346622d4d95298ca3279db Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Morales?= <jmoralz92@gmail.com>
Date: Tue, 22 Oct 2024 16:28:28 -0600
Subject: [PATCH 4/6] set rtol

---
 nbs/src/nixtla_client.ipynb | 1 +
 1 file changed, 1 insertion(+)

diff --git a/nbs/src/nixtla_client.ipynb b/nbs/src/nixtla_client.ipynb
index b5857d46..a0ece803 100644
--- a/nbs/src/nixtla_client.ipynb
+++ b/nbs/src/nixtla_client.ipynb
@@ -2032,6 +2032,7 @@
     "        fcst_no_rest_df,\n",
     "        fcst_rest_df,\n",
     "        atol=1e-4,\n",
+    "        rtol=1e-4,\n",
     "    )\n",
     "    return fcst_rest_df\n",
     "\n",

From f693e21d19bcdd2496066651171e812abf67bc07 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Morales?= <jmoralz92@gmail.com>
Date: Tue, 22 Oct 2024 16:42:04 -0600
Subject: [PATCH 5/6] plz

---
 nbs/src/nixtla_client.ipynb | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/nbs/src/nixtla_client.ipynb b/nbs/src/nixtla_client.ipynb
index a0ece803..ad0b13bb 100644
--- a/nbs/src/nixtla_client.ipynb
+++ b/nbs/src/nixtla_client.ipynb
@@ -2032,7 +2032,7 @@
     "        fcst_no_rest_df,\n",
     "        fcst_rest_df,\n",
     "        atol=1e-4,\n",
-    "        rtol=1e-4,\n",
+    "        rtol=1e-3,\n",
     "    )\n",
     "    return fcst_rest_df\n",
     "\n",

From 4018744b051c30b9f9450489a15821f9e05827e1 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jos=C3=A9=20Morales?= <jmoralz92@gmail.com>
Date: Tue, 22 Oct 2024 16:59:40 -0600
Subject: [PATCH 6/6] more tols

---
 nbs/docs/tutorials/12_irregular_timestamps.ipynb | 4 +++-
 nbs/src/nixtla_client.ipynb                      | 9 +++++++--
 2 files changed, 10 insertions(+), 3 deletions(-)

diff --git a/nbs/docs/tutorials/12_irregular_timestamps.ipynb b/nbs/docs/tutorials/12_irregular_timestamps.ipynb
index 88e492db..a0588425 100644
--- a/nbs/docs/tutorials/12_irregular_timestamps.ipynb
+++ b/nbs/docs/tutorials/12_irregular_timestamps.ipynb
@@ -196,7 +196,9 @@
     "    df_fed_test = pd.read_csv('https://raw.githubusercontent.com/Nixtla/transfer-learning-time-series/main/datasets/openbb/fed.csv')\n",
     "    pd.testing.assert_frame_equal(\n",
     "        nixtla_client.forecast(df_fed_test, h=12, target_col='FF', level=[90]),\n",
-    "        nixtla_client.forecast(df_fed_test, h=12, target_col='FF', freq='W', level=[90])\n",
+    "        nixtla_client.forecast(df_fed_test, h=12, target_col='FF', freq='W', level=[90]),\n",
+    "        atol=1e-4,\n",
+    "        rtol=1e-3,\n",
     "    )"
    ]
   },
diff --git a/nbs/src/nixtla_client.ipynb b/nbs/src/nixtla_client.ipynb
index ad0b13bb..5599e663 100644
--- a/nbs/src/nixtla_client.ipynb
+++ b/nbs/src/nixtla_client.ipynb
@@ -2213,7 +2213,7 @@
     "\n",
     "# test num partitions\n",
     "_ = nixtla_client.forecast(df=df_date_features, h=h, X_df=future_df, add_history=True, feature_contributions=True, num_partitions=2)\n",
-    "pd.testing.assert_frame_equal(nixtla_client.feature_contributions, shap_values_hist)"
+    "pd.testing.assert_frame_equal(nixtla_client.feature_contributions, shap_values_hist, atol=1e-4, rtol=1e-3)"
    ]
   },
   {
@@ -2266,7 +2266,12 @@
     "    fcst_cv = nixtla_client.cross_validation(df_ex_, h=12, **hyp)\n",
     "    fcst_cv = fcst_cv.sort_values(['unique_id', 'ds']).reset_index(drop=True)\n",
     "    logger.info('\\n\\nVerify difference\\n')\n",
-    "    pd.testing.assert_frame_equal(fcst_test, fcst_cv.drop(columns='cutoff'))"
+    "    pd.testing.assert_frame_equal(\n",
+    "        fcst_test,\n",
+    "        fcst_cv.drop(columns='cutoff'),\n",
+    "        atol=1e-4,\n",
+    "        rtol=1e-3,\n",
+    "    )"
    ]
   },
   {