pydata · shoyer · Apr 19, 2016 · Apr 16, 2016 · Apr 16, 2016 · Apr 16, 2016
diff --git a/doc/whats-new.rst b/doc/whats-new.rst
@@ -22,10 +22,26 @@ This release includes
 
 Enhancements
 ~~~~~~~~~~~~
+
 - DataArray and Dataset method :py:meth:`where` now supports a ``drop=True``
   option that clips coordinate elements that are fully masked.  By
   `Phillip J. Wolfram <https://github.com/pwolfram>`_.
 
+- DataArray and Dataset method :py:meth:`resample` now supports a
+  ``keep_attrs`` option (default ``False``) that determines whether variable
+  and dataset attributes are retained in the resampled object. By
+  `Jeremy McGibbon <https://github.com/mcgibbon>`_.
+
+Bug fixes
+~~~~~~~~~
+
+- Attributes were being retained by default for some resampling
+  operations when they should not have been. Because ``keep_attrs`` now
+  defaults to ``False``, they are no longer retained by default. This may be
+  backwards-incompatible with some scripts, but the attributes can be kept
+  by passing the ``keep_attrs=True`` option. By
+  `Jeremy McGibbon <https://github.com/mcgibbon>`_.
+
 .. _whats-new.0.7.2:
 
 v0.7.2 (13 March 2016)

diff --git a/xarray/core/common.py b/xarray/core/common.py
@@ -374,7 +374,7 @@ def rolling(self, min_periods=None, center=False, **windows):
                                 center=center, **windows)
 
     def resample(self, freq, dim, how='mean', skipna=None, closed=None,
-                 label=None, base=0):
+                 label=None, base=0, keep_attrs=False):
         """Resample this object to a new temporal resolution.
 
         Handles both downsampling and upsampling. Upsampling with filling is
@@ -418,6 +418,10 @@ def resample(self, freq, dim, how='mean', skipna=None, closed=None,
             For frequencies that evenly subdivide 1 day, the "origin" of the
             aggregated intervals. For example, for '24H' frequency, base could
             range from 0 through 23.
+        keep_attrs : bool, optional
+            If True, the object's attributes (`attrs`) will be copied from
+            the original object to the new one.  If False (default), the new
+            object will be returned without attributes.
 
         Returns
         -------
@@ -441,11 +445,11 @@ def resample(self, freq, dim, how='mean', skipna=None, closed=None,
         if isinstance(how, basestring):
             f = getattr(gb, how)
             if how in ['first', 'last']:
-                result = f(skipna=skipna)
+                result = f(skipna=skipna, keep_attrs=keep_attrs)
             else:
-                result = f(dim=dim.name, skipna=skipna)
+                result = f(dim=dim.name, skipna=skipna, keep_attrs=keep_attrs)
         else:
-            result = gb.reduce(how, dim=dim.name)
+            result = gb.reduce(how, dim=dim.name, keep_attrs=keep_attrs)
         result = result.rename({RESAMPLE_DIM: dim.name})
         return result
 

diff --git a/xarray/core/groupby.py b/xarray/core/groupby.py
@@ -320,7 +320,6 @@ def _concat_shortcut(self, applied, concat_dim, positions):
         # compiled language)
         stacked = Variable.concat(
             applied, concat_dim, positions, shortcut=True)
-        stacked.attrs.update(self.obj.attrs)
         result = self.obj._replace_maybe_drop_dims(stacked)
         result._coords[concat_dim.name] = as_variable(concat_dim, copy=True)
         return result

diff --git a/xarray/test/test_dataarray.py b/xarray/test/test_dataarray.py
@@ -1407,6 +1407,32 @@ def test_resample_first(self):
                              name='time')
         self.assertDataArrayIdentical(expected, actual)
 
+    def test_resample_first_keep_attrs(self):
+        times = pd.date_range('2000-01-01', freq='6H', periods=10)
+        array = DataArray(np.arange(10), [('time', times)])
+        array.attrs['meta'] = 'data'
+
+        resampled_array = array.resample('1D', dim='time', how='first', keep_attrs=True)
+        actual = resampled_array.attrs
+        expected = array.attrs
+        self.assertEqual(expected, actual)
+
+        resampled_array = array.resample('1D', dim='time', how='first', keep_attrs=False)
+        assert resampled_array.attrs == {}
+
+    def test_resample_mean_keep_attrs(self):
+        times = pd.date_range('2000-01-01', freq='6H', periods=10)
+        array = DataArray(np.arange(10), [('time', times)])
+        array.attrs['meta'] = 'data'
+
+        resampled_array = array.resample('1D', dim='time', how='mean', keep_attrs=True)
+        actual = resampled_array.attrs
+        expected = array.attrs
+        self.assertEqual(expected, actual)
+
+        resampled_array = array.resample('1D', dim='time', how='mean', keep_attrs=False)
+        assert resampled_array.attrs == {}
+
     def test_resample_skipna(self):
         times = pd.date_range('2000-01-01', freq='6H', periods=10)
         array = DataArray(np.ones(10), [('time', times)])

diff --git a/xarray/test/test_dataset.py b/xarray/test/test_dataset.py
@@ -1647,7 +1647,7 @@ def test_resample_and_first(self):
                       'bar': ('time', np.random.randn(10), {'meta': 'data'}),
                       'time': times})
 
-        actual = ds.resample('1D', dim='time', how='first')
+        actual = ds.resample('1D', dim='time', how='first', keep_attrs=True)
         expected = ds.isel(time=[0, 4, 8])
         self.assertDatasetIdentical(expected, actual)
 
@@ -1658,6 +1658,46 @@ def test_resample_and_first(self):
             actual = ds.resample('3H', 'time', how=how)
             self.assertDatasetEqual(expected, actual)
 
+    def test_resample_by_mean_with_keep_attrs(self):
+        times = pd.date_range('2000-01-01', freq='6H', periods=10)
+        ds = Dataset({'foo': (['time', 'x', 'y'], np.random.randn(10, 5, 3)),
+                      'bar': ('time', np.random.randn(10), {'meta': 'data'}),
+                      'time': times})
+        ds.attrs['dsmeta'] = 'dsdata'
+
+        resampled_ds = ds.resample('1D', dim='time', how='mean', keep_attrs=True)
+        actual = resampled_ds['bar'].attrs
+        expected = ds['bar'].attrs
+        self.assertEqual(expected, actual)
+
+        actual = resampled_ds.attrs
+        expected = ds.attrs
+        self.assertEqual(expected, actual)
+
+    def test_resample_by_mean_discarding_attrs(self):
+        times = pd.date_range('2000-01-01', freq='6H', periods=10)
+        ds = Dataset({'foo': (['time', 'x', 'y'], np.random.randn(10, 5, 3)),
+                      'bar': ('time', np.random.randn(10), {'meta': 'data'}),
+                      'time': times})
+        ds.attrs['dsmeta'] = 'dsdata'
+
+        resampled_ds = ds.resample('1D', dim='time', how='mean', keep_attrs=False)
+
+        assert resampled_ds['bar'].attrs == {}
+        assert resampled_ds.attrs == {}
+
+    def test_resample_by_last_discarding_attrs(self):
+        times = pd.date_range('2000-01-01', freq='6H', periods=10)
+        ds = Dataset({'foo': (['time', 'x', 'y'], np.random.randn(10, 5, 3)),
+                      'bar': ('time', np.random.randn(10), {'meta': 'data'}),
+                      'time': times})
+        ds.attrs['dsmeta'] = 'dsdata'
+
+        resampled_ds = ds.resample('1D', dim='time', how='last', keep_attrs=False)
+
+        assert resampled_ds['bar'].attrs == {}
+        assert resampled_ds.attrs == {}
+
     def test_to_array(self):
         ds = Dataset(OrderedDict([('a', 1), ('b', ('x', [1, 2, 3]))]),
                      coords={'c': 42}, attrs={'Conventions': 'None'})