From f043a547db02ecb66a8c0d389d3543f567eebb2b Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Fri, 10 Feb 2023 11:32:22 +0300 Subject: [PATCH 1/8] Fix bug in new NNs with forecasting interval --- etna/models/base.py | 3 +- .../test_inference/test_forecast.py | 69 ++++++++++--------- 2 files changed, 37 insertions(+), 35 deletions(-) diff --git a/etna/models/base.py b/etna/models/base.py index dccd4ca3f..cfc1cb7a7 100644 --- a/etna/models/base.py +++ b/etna/models/base.py @@ -629,7 +629,8 @@ def forecast(self, ts: "TSDataset", prediction_size: int) -> "TSDataset": dropna=False, ) predictions = self.raw_predict(test_dataset) - future_ts = ts.tsdataset_idx_slice(start_idx=self.encoder_length, end_idx=self.encoder_length + prediction_size) + end_idx = len(ts.index) + future_ts = ts.tsdataset_idx_slice(start_idx=end_idx - prediction_size, end_idx=end_idx) for (segment, feature_nm), value in predictions.items(): # we don't want to change dtype after assignment, but there can happen cast to float32 future_ts.df.loc[:, pd.IndexSlice[segment, feature_nm]] = value[:prediction_size, :].astype(np.float64) diff --git a/tests/test_models/test_inference/test_forecast.py b/tests/test_models/test_inference/test_forecast.py index 85cf65b3e..0a7e890be 100644 --- a/tests/test_models/test_inference/test_forecast.py +++ b/tests/test_models/test_inference/test_forecast.py @@ -85,21 +85,6 @@ def _test_forecast_in_sample_full_no_target(ts, model, transforms): def test_forecast_in_sample_full_no_target(self, model, transforms, example_tsds): self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) - @to_be_fixed(raises=AssertionError) - # Looks like a problem of current implementation of NNs - @pytest.mark.parametrize( - "model, transforms", - [ - (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), - ( - MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), - [LagTransform(in_column="target", lags=[5, 6])], - ), - ], - ) - def test_forecast_in_sample_full_no_target_failed_assertion_error(self, model, transforms, example_tsds): - self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) - @pytest.mark.parametrize( "model, transforms", [ @@ -126,6 +111,21 @@ def test_forecast_in_sample_full_no_target_failed_not_enough_context(self, model with pytest.raises(ValueError, match="Given context isn't big enough"): self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) + @to_be_fixed(raises=AssertionError) + # Looks like a problem of current implementation of NNs + @pytest.mark.parametrize( + "model, transforms", + [ + (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), + ( + MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), + [LagTransform(in_column="target", lags=[5, 6])], + ), + ], + ) + def test_forecast_in_sample_full_no_target_failed_assertion_error(self, model, transforms, example_tsds): + self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) + @to_be_fixed(raises=NotImplementedError, match="It is not possible to make in-sample predictions") @pytest.mark.parametrize( "model, transforms", @@ -181,7 +181,6 @@ class TestForecastInSampleFull: (HoltModel(), []), (HoltWintersModel(), []), (SimpleExpSmoothingModel(), []), - (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), ], ) def test_forecast_in_sample_full(self, model, transforms, example_tsds): @@ -200,19 +199,6 @@ def test_forecast_in_sample_full_failed_nans_lags(self, model, transforms, examp with pytest.raises(ValueError, match="Input contains NaN, infinity or a value too large"): _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") - @pytest.mark.parametrize( - "model, transforms", - [ - ( - MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), - [LagTransform(in_column="target", lags=[2, 3])], - ), - ], - ) - def test_forecast_in_sample_full_failed_nans_lags_nns(self, model, transforms, example_tsds): - with pytest.raises(AssertionError): - _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") - @pytest.mark.parametrize( "model, transforms", [ @@ -226,6 +212,21 @@ def test_forecast_in_sample_full_failed_not_enough_context(self, model, transfor with pytest.raises(ValueError, match="Given context isn't big enough"): _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") + @to_be_fixed(raises=AssertionError) + # Looks like a problem of current implementation of NNs + @pytest.mark.parametrize( + "model, transforms", + [ + (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), + ( + MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), + [LagTransform(in_column="target", lags=[2, 3])], + ), + ], + ) + def test_forecast_in_sample_full_failed_nans_lags_nns(self, model, transforms, example_tsds): + _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") + @to_be_fixed(raises=NotImplementedError, match="It is not possible to make in-sample predictions") @pytest.mark.parametrize( "model, transforms", @@ -548,7 +549,7 @@ def _test_forecast_out_sample_suffix(ts, model, transforms, full_prediction_size # firstly we should forecast prefix to use it as a context forecast_prefix_ts = deepcopy(forecast_gap_ts) forecast_prefix_ts.df = forecast_prefix_ts.df.iloc[:-suffix_prediction_size] - model.forecast(forecast_prefix_ts, prediction_size=prediction_size_diff) + forecast_prefix_ts = model.forecast(forecast_prefix_ts, prediction_size=prediction_size_diff) forecast_gap_ts.df = forecast_gap_ts.df.combine_first(forecast_prefix_ts.df) # forecast suffix with known context for it @@ -583,6 +584,10 @@ def _test_forecast_out_sample_suffix(ts, model, transforms, full_prediction_size (SeasonalMovingAverageModel(), []), (NaiveModel(lag=3), []), (DeadlineMovingAverageModel(window=1), []), + ( + MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), + [LagTransform(in_column="target", lags=[5, 6])], + ), ], ) def test_forecast_out_sample_suffix(self, model, transforms, example_tsds): @@ -594,10 +599,6 @@ def test_forecast_out_sample_suffix(self, model, transforms, example_tsds): "model, transforms", [ (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), - ( - MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), - [LagTransform(in_column="target", lags=[5, 6])], - ), ], ) def test_forecast_out_sample_suffix_failed_assertion_error(self, model, transforms, example_tsds): From dd4c630b26dd719d9c75f24b88e3b401d7cabb19 Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Fri, 10 Feb 2023 11:34:26 +0300 Subject: [PATCH 2/8] Update changelog --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 921fdc1e8..1661a59fd 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -25,7 +25,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 - - ### Fixed -- +- Fix alignment during forecasting in new NNs ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) - Fix `MeanSegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1104](https://github.com/tinkoff-ai/etna/pull/1104)) - - Fix `SegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1103](https://github.com/tinkoff-ai/etna/pull/1103)) From ebbabe27804a3be0a512268261026e4cde5e97d2 Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Tue, 21 Feb 2023 17:19:21 +0300 Subject: [PATCH 3/8] Mark test test_forecast_out_sample_suffix_failed_rnn --- tests/test_models/test_inference/test_forecast.py | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/tests/test_models/test_inference/test_forecast.py b/tests/test_models/test_inference/test_forecast.py index 9b75b50b8..c74ee7269 100644 --- a/tests/test_models/test_inference/test_forecast.py +++ b/tests/test_models/test_inference/test_forecast.py @@ -594,16 +594,19 @@ def _test_forecast_out_sample_suffix(ts, model, transforms, full_prediction_size def test_forecast_out_sample_suffix(self, model, transforms, example_tsds): self._test_forecast_out_sample_suffix(example_tsds, model, transforms) - @to_be_fixed(raises=AssertionError) - # Looks like a problem of current implementation of NNs @pytest.mark.parametrize( "model, transforms", [ (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), ], ) - def test_forecast_out_sample_suffix_failed_assertion_error(self, model, transforms, example_tsds): - self._test_forecast_out_sample_suffix(example_tsds, model, transforms) + def test_forecast_out_sample_suffix_failed_rnn(self, model, transforms, example_tsds): + """This test is expected to fail due to autoregression in RNN. + + More about it in issue: https://github.com/tinkoff-ai/etna/issues/1087 + """ + with pytest.raises(AssertionError): + self._test_forecast_out_sample_suffix(example_tsds, model, transforms) @to_be_fixed(raises=NotImplementedError, match="You can only forecast from the next point after the last one") @pytest.mark.parametrize( From de7ffbd84e74ce3d2430fb7ea4c831f5f7dce28f Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Tue, 21 Feb 2023 17:39:35 +0300 Subject: [PATCH 4/8] Fix error message for seasonal-ma, deadline-ma if context isn't big enough, add check on size of context for DeepBaseModel and test for it --- etna/models/base.py | 6 ++++++ etna/models/deadline_ma.py | 4 ++-- etna/models/seasonal_ma.py | 4 ++-- tests/test_models/test_base.py | 7 +++++++ tests/test_models/test_inference/test_forecast.py | 2 +- 5 files changed, 18 insertions(+), 5 deletions(-) diff --git a/etna/models/base.py b/etna/models/base.py index cfc1cb7a7..cf307de53 100644 --- a/etna/models/base.py +++ b/etna/models/base.py @@ -622,6 +622,12 @@ def forecast(self, ts: "TSDataset", prediction_size: int) -> "TSDataset": : Dataset with predictions """ + expected_length = prediction_size + self.encoder_length + if len(ts.index) < expected_length: + raise ValueError( + "Given context isn't big enough, try to decrease context_size, prediction_size or increase length of given dataset!" + ) + test_dataset = ts.to_torch_dataset( make_samples=functools.partial( self.net.make_samples, encoder_length=self.encoder_length, decoder_length=prediction_size diff --git a/etna/models/deadline_ma.py b/etna/models/deadline_ma.py index 8549d4c68..80bb49893 100644 --- a/etna/models/deadline_ma.py +++ b/etna/models/deadline_ma.py @@ -119,7 +119,7 @@ def _get_context_beginning( # if we have len(history_timestamps) == 0, then len(df) <= prediction_size if len(history_timestamps) == 0: raise ValueError( - "Given context isn't big enough, try to decrease context_size, prediction_size of increase length of given dataframe!" + "Given context isn't big enough, try to decrease context_size, prediction_size or increase length of given dataframe!" ) if seasonality is SeasonalityMode.month: @@ -130,7 +130,7 @@ def _get_context_beginning( if first_index < history_timestamps.iloc[0]: raise ValueError( - "Given context isn't big enough, try to decrease context_size, prediction_size of increase length of given dataframe!" + "Given context isn't big enough, try to decrease context_size, prediction_size or increase length of given dataframe!" ) return first_index diff --git a/etna/models/seasonal_ma.py b/etna/models/seasonal_ma.py index 99fc8d588..d4bfd5d02 100644 --- a/etna/models/seasonal_ma.py +++ b/etna/models/seasonal_ma.py @@ -88,7 +88,7 @@ def forecast(self, df: pd.DataFrame, prediction_size: int) -> np.ndarray: expected_length = prediction_size + self.shift if len(df) < expected_length: raise ValueError( - "Given context isn't big enough, try to decrease context_size, prediction_size of increase length of given dataframe!" + "Given context isn't big enough, try to decrease context_size, prediction_size or increase length of given dataframe!" ) history = df["target"][-expected_length:-prediction_size] @@ -127,7 +127,7 @@ def predict(self, df: pd.DataFrame, prediction_size: int) -> np.ndarray: expected_length = prediction_size + self.shift if len(df) < expected_length: raise ValueError( - "Given context isn't big enough, try to decrease context_size, prediction_size of increase length of given dataframe!" + "Given context isn't big enough, try to decrease context_size, prediction_size or increase length of given dataframe!" ) context = df["target"][-expected_length:].values diff --git a/tests/test_models/test_base.py b/tests/test_models/test_base.py index 9ae93dffc..bd6b5bb20 100644 --- a/tests/test_models/test_base.py +++ b/tests/test_models/test_base.py @@ -14,6 +14,7 @@ @pytest.fixture() def deep_base_model_mock(): model = MagicMock() + model.encoder_length = 10 model.train_batch_size = 32 model.train_dataloader_params = {} model.val_dataloader_params = {} @@ -145,6 +146,12 @@ def test_deep_base_model_forecast_inverse_transform_call_check(deep_base_model_m ts.tsdataset_idx_slice.return_value.inverse_transform.assert_called_once() +def test_deep_base_model_forecast_fail_not_enough_context(deep_base_model_mock, sized_torch_dataset_mock): + horizon = len(sized_torch_dataset_mock) + with pytest.raises(ValueError, match="Given context isn't big enough"): + _ = DeepBaseModel.forecast(self=deep_base_model_mock, ts=sized_torch_dataset_mock, prediction_size=horizon) + + def test_deep_base_model_forecast_loop(simple_df, deep_base_model_mock): ts = MagicMock() ts_after_tsdataset_idx_slice = MagicMock() diff --git a/tests/test_models/test_inference/test_forecast.py b/tests/test_models/test_inference/test_forecast.py index c74ee7269..92992c523 100644 --- a/tests/test_models/test_inference/test_forecast.py +++ b/tests/test_models/test_inference/test_forecast.py @@ -106,6 +106,7 @@ def test_forecast_in_sample_full_no_target_failed_nans_lags(self, model, transfo (NaiveModel(lag=3), []), (SeasonalMovingAverageModel(), []), (DeadlineMovingAverageModel(window=1), []), + (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), ], ) def test_forecast_in_sample_full_no_target_failed_not_enough_context(self, model, transforms, example_tsds): @@ -117,7 +118,6 @@ def test_forecast_in_sample_full_no_target_failed_not_enough_context(self, model @pytest.mark.parametrize( "model, transforms", [ - (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), ( MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), [LagTransform(in_column="target", lags=[5, 6])], From b87699f8ac71460f8edf10a5f41b990c1967c1f4 Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Tue, 21 Feb 2023 20:26:50 +0300 Subject: [PATCH 5/8] Add check on NaNs for MLP and tests for it --- CHANGELOG.md | 2 +- etna/models/nn/mlp.py | 4 ++ tests/test_models/nn/test_mlp.py | 23 +++++++- tests/test_models/test_base.py | 29 +++++----- .../test_inference/test_forecast.py | 53 +++++++++++-------- .../test_inference/test_predict.py | 2 +- 6 files changed, 75 insertions(+), 38 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 7810cc5f8..6970d5c27 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -26,7 +26,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 - ### Fixed - Fix inference tests on new segments for `DeepARModel` and `TFTModel` ([#1109](https://github.com/tinkoff-ai/etna/pull/1109)) -- Fix alignment during forecasting in new NNs ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) +- Fix alignment during forecasting in new NNs, add exception on too small context in new NNs, add exception when there are NaNs during prediction by `MLPModel` ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) - Fix `MeanSegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1104](https://github.com/tinkoff-ai/etna/pull/1104)) - - Fix `SegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1103](https://github.com/tinkoff-ai/etna/pull/1103)) diff --git a/etna/models/nn/mlp.py b/etna/models/nn/mlp.py index 3887b58a8..6527c24f9 100644 --- a/etna/models/nn/mlp.py +++ b/etna/models/nn/mlp.py @@ -79,6 +79,8 @@ def forward(self, batch: MLPBatch): # type: ignore forecast """ decoder_real = batch["decoder_real"].float() + if decoder_real.isnan().sum().item(): + raise ValueError("There are NaNs in features, this model can't work with them!") return self.mlp(decoder_real) def step(self, batch: MLPBatch, *args, **kwargs): # type: ignore @@ -95,6 +97,8 @@ def step(self, batch: MLPBatch, *args, **kwargs): # type: ignore """ decoder_real = batch["decoder_real"].float() decoder_target = batch["decoder_target"].float() + if decoder_real.isnan().sum().item(): + raise ValueError("There are NaNs in features, this model can't work with them!") output = self.mlp(decoder_real) loss = self.loss(output, decoder_target) diff --git a/tests/test_models/nn/test_mlp.py b/tests/test_models/nn/test_mlp.py index 639305244..aed7f9448 100644 --- a/tests/test_models/nn/test_mlp.py +++ b/tests/test_models/nn/test_mlp.py @@ -24,7 +24,6 @@ ], ) def test_mlp_model_run_weekly_overfit_with_scaler(ts_dataset_weekly_function_with_horizon, horizon): - ts_train, ts_test = ts_dataset_weekly_function_with_horizon(horizon) lag = LagTransform(in_column="target", lags=list(range(horizon, horizon + 4))) fourier = FourierTransform(period=7, order=3) @@ -80,6 +79,17 @@ def test_mlp_make_samples(simple_df_relevance): np.testing.assert_equal(df[["target"]].iloc[decoder_length : 2 * decoder_length], second_sample["decoder_target"]) +def test_mlp_forward_fail_nans(): + batch = { + "decoder_real": torch.Tensor([[torch.nan, 2, 3], [1, 2, 3], [1, 2, 3]]), + "decoder_target": torch.Tensor([[1], [2], [3]]), + "segment": "A", + } + model = MLPNet(input_size=3, hidden_size=[1], lr=1e-2, loss=nn.MSELoss(), optimizer_params=None) + with pytest.raises(ValueError, match="There are NaNs in features"): + _ = model.forward(batch) + + def test_mlp_step(): batch = { @@ -96,6 +106,17 @@ def test_mlp_step(): assert output.shape == torch.Size([3, 1]) +def test_mlp_step_fail_nans(): + batch = { + "decoder_real": torch.Tensor([[torch.nan, 2, 3], [1, 2, 3], [1, 2, 3]]), + "decoder_target": torch.Tensor([[1], [2], [3]]), + "segment": "A", + } + model = MLPNet(input_size=3, hidden_size=[1], lr=1e-2, loss=nn.MSELoss(), optimizer_params=None) + with pytest.raises(ValueError, match="There are NaNs in features"): + _ = model.step(batch) + + def test_mlp_layers(): model = MLPNet(input_size=3, hidden_size=[10], lr=1e-2, loss=None, optimizer_params=None) model_ = nn.Sequential( diff --git a/tests/test_models/test_base.py b/tests/test_models/test_base.py index bd6b5bb20..824285962 100644 --- a/tests/test_models/test_base.py +++ b/tests/test_models/test_base.py @@ -24,6 +24,13 @@ def deep_base_model_mock(): return model +@pytest.fixture() +def ts_mock(): + torch_dataset = MagicMock() + torch_dataset.index.__len__.return_value = 100 + return torch_dataset + + @pytest.fixture() def sized_torch_dataset_mock(): torch_dataset = MagicMock() @@ -139,21 +146,19 @@ def test_deep_base_model_raw_predict_call(dataloader, deep_base_model_mock): np.testing.assert_allclose(predictions_dict[("segment2", "target")], batch["target"][1].numpy()) -def test_deep_base_model_forecast_inverse_transform_call_check(deep_base_model_mock): - ts = MagicMock() +def test_deep_base_model_forecast_inverse_transform_call_check(deep_base_model_mock, ts_mock): horizon = 7 - DeepBaseModel.forecast(self=deep_base_model_mock, ts=ts, prediction_size=horizon) - ts.tsdataset_idx_slice.return_value.inverse_transform.assert_called_once() + DeepBaseModel.forecast(self=deep_base_model_mock, ts=ts_mock, prediction_size=horizon) + ts_mock.tsdataset_idx_slice.return_value.inverse_transform.assert_called_once() -def test_deep_base_model_forecast_fail_not_enough_context(deep_base_model_mock, sized_torch_dataset_mock): - horizon = len(sized_torch_dataset_mock) +def test_deep_base_model_forecast_fail_not_enough_context(deep_base_model_mock, ts_mock): + horizon = len(ts_mock.index) with pytest.raises(ValueError, match="Given context isn't big enough"): - _ = DeepBaseModel.forecast(self=deep_base_model_mock, ts=sized_torch_dataset_mock, prediction_size=horizon) + _ = DeepBaseModel.forecast(self=deep_base_model_mock, ts=ts_mock, prediction_size=horizon) -def test_deep_base_model_forecast_loop(simple_df, deep_base_model_mock): - ts = MagicMock() +def test_deep_base_model_forecast_loop(simple_df, deep_base_model_mock, ts_mock): ts_after_tsdataset_idx_slice = MagicMock() horizon = 7 @@ -161,13 +166,13 @@ def test_deep_base_model_forecast_loop(simple_df, deep_base_model_mock): deep_base_model_mock.raw_predict.return_value = raw_predict ts_after_tsdataset_idx_slice.df = simple_df.df.iloc[-horizon:] - ts.tsdataset_idx_slice.return_value = ts_after_tsdataset_idx_slice + ts_mock.tsdataset_idx_slice.return_value = ts_after_tsdataset_idx_slice - future = DeepBaseModel.forecast(self=deep_base_model_mock, ts=ts, prediction_size=horizon) + future = DeepBaseModel.forecast(self=deep_base_model_mock, ts=ts_mock, prediction_size=horizon) np.testing.assert_allclose( future.df.loc[:, pd.IndexSlice["A", "target"]], raw_predict[("A", "target")][:horizon, 0] ) np.testing.assert_allclose( future.df.loc[:, pd.IndexSlice["B", "target"]], raw_predict[("B", "target")][:horizon, 0] ) - ts.tsdataset_idx_slice.return_value.inverse_transform.assert_called_once() + ts_mock.tsdataset_idx_slice.return_value.inverse_transform.assert_called_once() diff --git a/tests/test_models/test_inference/test_forecast.py b/tests/test_models/test_inference/test_forecast.py index 92992c523..0d0588ede 100644 --- a/tests/test_models/test_inference/test_forecast.py +++ b/tests/test_models/test_inference/test_forecast.py @@ -95,10 +95,23 @@ def test_forecast_in_sample_full_no_target(self, model, transforms, example_tsds (ElasticMultiSegmentModel(), [LagTransform(in_column="target", lags=[2, 3])]), ], ) - def test_forecast_in_sample_full_no_target_failed_nans_lags(self, model, transforms, example_tsds): + def test_forecast_in_sample_full_no_target_failed_nans_sklearn(self, model, transforms, example_tsds): with pytest.raises(ValueError, match="Input contains NaN, infinity or a value too large"): self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) + @pytest.mark.parametrize( + "model, transforms", + [ + ( + MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), + [LagTransform(in_column="target", lags=[5, 6])], + ), + ], + ) + def test_forecast_in_sample_full_no_target_failed_nans_nn(self, model, transforms, example_tsds): + with pytest.raises(ValueError, match="There are NaNs in features"): + self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) + @pytest.mark.parametrize( "model, transforms", [ @@ -113,20 +126,6 @@ def test_forecast_in_sample_full_no_target_failed_not_enough_context(self, model with pytest.raises(ValueError, match="Given context isn't big enough"): self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) - @to_be_fixed(raises=AssertionError) - # Looks like a problem of current implementation of NNs - @pytest.mark.parametrize( - "model, transforms", - [ - ( - MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), - [LagTransform(in_column="target", lags=[5, 6])], - ), - ], - ) - def test_forecast_in_sample_full_no_target_failed_assertion_error(self, model, transforms, example_tsds): - self._test_forecast_in_sample_full_no_target(example_tsds, model, transforms) - @to_be_fixed(raises=NotImplementedError, match="It is not possible to make in-sample predictions") @pytest.mark.parametrize( "model, transforms", @@ -196,10 +195,23 @@ def test_forecast_in_sample_full(self, model, transforms, example_tsds): (ElasticMultiSegmentModel(), [LagTransform(in_column="target", lags=[2, 3])]), ], ) - def test_forecast_in_sample_full_failed_nans_lags(self, model, transforms, example_tsds): + def test_forecast_in_sample_full_failed_nans_sklearn(self, model, transforms, example_tsds): with pytest.raises(ValueError, match="Input contains NaN, infinity or a value too large"): _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") + @pytest.mark.parametrize( + "model, transforms", + [ + ( + MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), + [LagTransform(in_column="target", lags=[2, 3])], + ), + ], + ) + def test_forecast_in_sample_full_failed_nans_nn(self, model, transforms, example_tsds): + with pytest.raises(ValueError, match="There are NaNs in features"): + _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") + @pytest.mark.parametrize( "model, transforms", [ @@ -207,6 +219,7 @@ def test_forecast_in_sample_full_failed_nans_lags(self, model, transforms, examp (NaiveModel(lag=3), []), (SeasonalMovingAverageModel(), []), (DeadlineMovingAverageModel(window=1), []), + (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), ], ) def test_forecast_in_sample_full_failed_not_enough_context(self, model, transforms, example_tsds): @@ -217,13 +230,7 @@ def test_forecast_in_sample_full_failed_not_enough_context(self, model, transfor # Looks like a problem of current implementation of NNs @pytest.mark.parametrize( "model, transforms", - [ - (RNNModel(input_size=1, encoder_length=7, decoder_length=7, trainer_params=dict(max_epochs=1)), []), - ( - MLPModel(input_size=2, hidden_size=[10], decoder_length=7, trainer_params=dict(max_epochs=1)), - [LagTransform(in_column="target", lags=[2, 3])], - ), - ], + [], ) def test_forecast_in_sample_full_failed_nans_lags_nns(self, model, transforms, example_tsds): _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="forecast") diff --git a/tests/test_models/test_inference/test_predict.py b/tests/test_models/test_inference/test_predict.py index eebfedb64..a89d462e9 100644 --- a/tests/test_models/test_inference/test_predict.py +++ b/tests/test_models/test_inference/test_predict.py @@ -74,7 +74,7 @@ def test_predict_in_sample_full(self, model, transforms, example_tsds): (ElasticMultiSegmentModel(), [LagTransform(in_column="target", lags=[2, 3])]), ], ) - def test_predict_in_sample_full_failed_not_enough_context(self, model, transforms, example_tsds): + def test_predict_in_sample_full_failed_nans_sklearn(self, model, transforms, example_tsds): with pytest.raises(ValueError, match="Input contains NaN, infinity or a value too large"): _test_prediction_in_sample_full(example_tsds, model, transforms, method_name="predict") From 38d393661178a34b7246bb2db80654a4bf688c82 Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Tue, 21 Feb 2023 20:30:48 +0300 Subject: [PATCH 6/8] Refactor validation of batch in MLPNet --- etna/models/nn/mlp.py | 11 +++++++---- 1 file changed, 7 insertions(+), 4 deletions(-) diff --git a/etna/models/nn/mlp.py b/etna/models/nn/mlp.py index 6527c24f9..034b1b252 100644 --- a/etna/models/nn/mlp.py +++ b/etna/models/nn/mlp.py @@ -66,6 +66,11 @@ def __init__( layers.append(nn.Linear(in_features=hidden_size[-1], out_features=1)) self.mlp = nn.Sequential(*layers) + @staticmethod + def _validate_batch(batch: MLPBatch): + if batch["decoder_real"].isnan().sum().item(): + raise ValueError("There are NaNs in features, this model can't work with them!") + def forward(self, batch: MLPBatch): # type: ignore """Forward pass. @@ -78,9 +83,8 @@ def forward(self, batch: MLPBatch): # type: ignore : forecast """ + self._validate_batch(batch) decoder_real = batch["decoder_real"].float() - if decoder_real.isnan().sum().item(): - raise ValueError("There are NaNs in features, this model can't work with them!") return self.mlp(decoder_real) def step(self, batch: MLPBatch, *args, **kwargs): # type: ignore @@ -95,10 +99,9 @@ def step(self, batch: MLPBatch, *args, **kwargs): # type: ignore : loss, true_target, prediction_target """ + self._validate_batch(batch) decoder_real = batch["decoder_real"].float() decoder_target = batch["decoder_target"].float() - if decoder_real.isnan().sum().item(): - raise ValueError("There are NaNs in features, this model can't work with them!") output = self.mlp(decoder_real) loss = self.loss(output, decoder_target) From da0d5a8c6f1c041fbb7ea7cc5158c08660141355 Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Tue, 21 Feb 2023 20:31:26 +0300 Subject: [PATCH 7/8] Update changelog --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 6970d5c27..565328815 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -26,7 +26,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 - ### Fixed - Fix inference tests on new segments for `DeepARModel` and `TFTModel` ([#1109](https://github.com/tinkoff-ai/etna/pull/1109)) -- Fix alignment during forecasting in new NNs, add exception on too small context in new NNs, add exception when there are NaNs during prediction by `MLPModel` ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) +- Fix alignment during forecasting in new NNs, add exception on too small context in new NNs, add validation of batch in `MLPNet` ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) - Fix `MeanSegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1104](https://github.com/tinkoff-ai/etna/pull/1104)) - - Fix `SegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1103](https://github.com/tinkoff-ai/etna/pull/1103)) From af666cb10b77377c06f95b346ed32f23f2304836 Mon Sep 17 00:00:00 2001 From: "d.a.bunin" Date: Tue, 21 Feb 2023 20:32:00 +0300 Subject: [PATCH 8/8] Update changelog --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 565328815..14bc9f578 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -26,7 +26,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 - ### Fixed - Fix inference tests on new segments for `DeepARModel` and `TFTModel` ([#1109](https://github.com/tinkoff-ai/etna/pull/1109)) -- Fix alignment during forecasting in new NNs, add exception on too small context in new NNs, add validation of batch in `MLPNet` ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) +- Fix alignment during forecasting in new NNs, add validation of context size during forecasting in new NNs, add validation of batch in `MLPNet` ([#1108](https://github.com/tinkoff-ai/etna/pull/1108)) - Fix `MeanSegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1104](https://github.com/tinkoff-ai/etna/pull/1104)) - - Fix `SegmentEncoderTransform` to work with subset of segments and raise error on new segments ([#1103](https://github.com/tinkoff-ai/etna/pull/1103))