From 8322f9a474f4a31ea5ba17111a05cd849fd60d4e Mon Sep 17 00:00:00 2001 From: Ruth Comer Date: Thu, 29 Sep 2022 15:59:09 +0100 Subject: [PATCH 1/5] Enable lazy RMS aggregation with weights Note that the referenced dask issue was fixed by dask#4236 which was included in v1.1.0. --- lib/iris/analysis/__init__.py | 22 ++++------------ lib/iris/tests/unit/analysis/test_RMS.py | 32 ++++++++---------------- 2 files changed, 15 insertions(+), 39 deletions(-) diff --git a/lib/iris/analysis/__init__.py b/lib/iris/analysis/__init__.py index f34cda1402..76d769cf61 100644 --- a/lib/iris/analysis/__init__.py +++ b/lib/iris/analysis/__init__.py @@ -1583,27 +1583,15 @@ def _lazy_max_run(array, axis=-1, **kwargs): def _rms(array, axis, **kwargs): - # XXX due to the current limitations in `da.average` (see below), maintain - # an explicit non-lazy aggregation function for now. - # Note: retaining this function also means that if weights are passed to - # the lazy aggregator, the aggregation will fall back to using this - # non-lazy aggregator. - rval = np.sqrt(ma.average(np.square(array), axis=axis, **kwargs)) - if not ma.isMaskedArray(array): - rval = np.asarray(rval) + rval = np.sqrt(ma.average(array**2, axis=axis, **kwargs)) + return rval -@_build_dask_mdtol_function def _lazy_rms(array, axis, **kwargs): - # XXX This should use `da.average` and not `da.mean`, as does the above. - # However `da.average` current doesn't handle masked weights correctly - # (see https://github.com/dask/dask/issues/3846). - # To work around this we use da.mean, which doesn't support weights at - # all. Thus trying to use this aggregator with weights will currently - # raise an error in dask due to the unexpected keyword `weights`, - # rather than silently returning the wrong answer. - return da.sqrt(da.mean(array**2, axis=axis, **kwargs)) + rval = da.sqrt(da.ma.average(array**2, axis=axis, **kwargs)) + + return rval def _sum(array, **kwargs): diff --git a/lib/iris/tests/unit/analysis/test_RMS.py b/lib/iris/tests/unit/analysis/test_RMS.py index 141b3e262b..74f309ce00 100644 --- a/lib/iris/tests/unit/analysis/test_RMS.py +++ b/lib/iris/tests/unit/analysis/test_RMS.py @@ -101,20 +101,16 @@ def test_1d_weighted(self): data = as_lazy_data(np.array([4, 7, 10, 8], dtype=np.float64)) weights = np.array([1, 4, 3, 2], dtype=np.float64) expected_rms = 8.0 - # https://github.com/dask/dask/issues/3846. - with self.assertRaisesRegex(TypeError, "unexpected keyword argument"): - rms = RMS.lazy_aggregate(data, 0, weights=weights) - self.assertAlmostEqual(rms, expected_rms) + rms = RMS.lazy_aggregate(data, 0, weights=weights) + self.assertAlmostEqual(rms, expected_rms) def test_1d_lazy_weighted(self): # 1-dimensional input with lazy weights. data = as_lazy_data(np.array([4, 7, 10, 8], dtype=np.float64)) weights = as_lazy_data(np.array([1, 4, 3, 2], dtype=np.float64)) expected_rms = 8.0 - # https://github.com/dask/dask/issues/3846. - with self.assertRaisesRegex(TypeError, "unexpected keyword argument"): - rms = RMS.lazy_aggregate(data, 0, weights=weights) - self.assertAlmostEqual(rms, expected_rms) + rms = RMS.lazy_aggregate(data, 0, weights=weights) + self.assertAlmostEqual(rms, expected_rms) def test_2d_weighted(self): # 2-dimensional input with weights. @@ -123,20 +119,16 @@ def test_2d_weighted(self): ) weights = np.array([[1, 4, 3, 2], [2, 1, 1.5, 0.5]], dtype=np.float64) expected_rms = np.array([8.0, 16.0], dtype=np.float64) - # https://github.com/dask/dask/issues/3846. - with self.assertRaisesRegex(TypeError, "unexpected keyword argument"): - rms = RMS.lazy_aggregate(data, 1, weights=weights) - self.assertArrayAlmostEqual(rms, expected_rms) + rms = RMS.lazy_aggregate(data, 1, weights=weights) + self.assertArrayAlmostEqual(rms, expected_rms) def test_unit_weighted(self): # Unit weights should be the same as no weights. data = as_lazy_data(np.array([5, 2, 6, 4], dtype=np.float64)) weights = np.ones_like(data) expected_rms = 4.5 - # https://github.com/dask/dask/issues/3846. - with self.assertRaisesRegex(TypeError, "unexpected keyword argument"): - rms = RMS.lazy_aggregate(data, 0, weights=weights) - self.assertAlmostEqual(rms, expected_rms) + rms = RMS.lazy_aggregate(data, 0, weights=weights) + self.assertAlmostEqual(rms, expected_rms) def test_masked(self): # Masked entries should be completely ignored. @@ -152,9 +144,6 @@ def test_masked(self): self.assertAlmostEqual(rms, expected_rms) def test_masked_weighted(self): - # Weights should work properly with masked arrays, but currently don't - # (see https://github.com/dask/dask/issues/3846). - # For now, masked weights are simply not supported. data = as_lazy_data( ma.array( [4, 7, 18, 10, 11, 8], @@ -164,9 +153,8 @@ def test_masked_weighted(self): ) weights = np.array([1, 4, 5, 3, 8, 2]) expected_rms = 8.0 - with self.assertRaisesRegex(TypeError, "unexpected keyword argument"): - rms = RMS.lazy_aggregate(data, 0, weights=weights) - self.assertAlmostEqual(rms, expected_rms) + rms = RMS.lazy_aggregate(data, 0, weights=weights) + self.assertAlmostEqual(rms, expected_rms) class Test_name(tests.IrisTest): From cd8f3e42eb43aacb46d0ed806233627d11292500 Mon Sep 17 00:00:00 2001 From: Ruth Comer Date: Fri, 7 Oct 2022 15:54:35 +0100 Subject: [PATCH 2/5] whatsnew --- docs/src/whatsnew/latest.rst | 3 +++ 1 file changed, 3 insertions(+) diff --git a/docs/src/whatsnew/latest.rst b/docs/src/whatsnew/latest.rst index b23687af7a..cafe840725 100644 --- a/docs/src/whatsnew/latest.rst +++ b/docs/src/whatsnew/latest.rst @@ -36,6 +36,9 @@ This document explains the changes made to Iris for this release :ref:`documentation page` for further information. (:pull:`5144`) +#. `@rcomer`_ enabled lazy evaluation of :obj:`~iris.analysis.RMS` calcuations + with weights. (:pull:`5016`) + 🐛 Bugs Fixed ============= From 9a87aacbaba9e3b98e579e73529d2b6a2d4659f5 Mon Sep 17 00:00:00 2001 From: Ruth Comer Date: Fri, 7 Oct 2022 16:05:17 +0100 Subject: [PATCH 3/5] docstring --- lib/iris/analysis/__init__.py | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/lib/iris/analysis/__init__.py b/lib/iris/analysis/__init__.py index 76d769cf61..87b3ae516c 100644 --- a/lib/iris/analysis/__init__.py +++ b/lib/iris/analysis/__init__.py @@ -2059,14 +2059,16 @@ def interp_order(length): the root mean square over a :class:`~iris.cube.Cube`, as computed by ((x0**2 + x1**2 + ... + xN-1**2) / N) ** 0.5. -Additional kwargs associated with the use of this aggregator: +Parameters +---------- -* weights (float ndarray): +weights : array-like, optional Weights matching the shape of the cube or the length of the window for rolling window operations. The weights are applied to the squares when taking the mean. -**For example**: +Example +------- To compute the zonal root mean square over the *longitude* axis of a cube:: From 1fc6cf7253cf6f98cc586bf93b934c1b3dc71802 Mon Sep 17 00:00:00 2001 From: Ruth Comer Date: Fri, 7 Oct 2022 16:41:20 +0100 Subject: [PATCH 4/5] add note about NEP13/18 not applying --- lib/iris/analysis/__init__.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/lib/iris/analysis/__init__.py b/lib/iris/analysis/__init__.py index 87b3ae516c..c80469c3c7 100644 --- a/lib/iris/analysis/__init__.py +++ b/lib/iris/analysis/__init__.py @@ -1589,6 +1589,10 @@ def _rms(array, axis, **kwargs): def _lazy_rms(array, axis, **kwargs): + # Note that, since we specifically need the ma version of average to handle + # weights correctly with masked data, we cannot rely on NEP13/18 and need + # to implement a separate lazy RMS function. + rval = da.sqrt(da.ma.average(array**2, axis=axis, **kwargs)) return rval From 7ba83ef6a9dc1c71e83b10b7bb047a58b7d3543c Mon Sep 17 00:00:00 2001 From: Ruth Comer Date: Mon, 27 Feb 2023 11:07:34 +0000 Subject: [PATCH 5/5] whatsnew PR num fix --- docs/src/whatsnew/latest.rst | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docs/src/whatsnew/latest.rst b/docs/src/whatsnew/latest.rst index cafe840725..8882dccd85 100644 --- a/docs/src/whatsnew/latest.rst +++ b/docs/src/whatsnew/latest.rst @@ -37,7 +37,7 @@ This document explains the changes made to Iris for this release (:pull:`5144`) #. `@rcomer`_ enabled lazy evaluation of :obj:`~iris.analysis.RMS` calcuations - with weights. (:pull:`5016`) + with weights. (:pull:`5017`) 🐛 Bugs Fixed