shwina · shwina · Mar 15, 2022 · Mar 10, 2022 · Mar 14, 2022 · crusaderky
diff --git a/dask_cuda/device_host_file.py b/dask_cuda/device_host_file.py
@@ -260,6 +260,16 @@ def __delitem__(self, key):
         self.device_keys.discard(key)
         del self.device_buffer[key]
 
+    def evict(self):
+        """Evict the least recently used buffer from host (CPU/system) memory.
+
+        Implements the distributed.spill.ManualEvictProto interface."""
+        try:
+            _key, _value, evicted_weight = self.host_buffer.fast.evict()
+        except Exception:  # Catch every `Exception`, mirroring zict.LRU
+            return -1
+        return evicted_weight
+
     def set_address(self, addr):
         if isinstance(self.host_buffer, LoggedBuffer):
             self.host_buffer.set_address(addr)

diff --git a/dask_cuda/tests/test_spill.py b/dask_cuda/tests/test_spill.py
@@ -84,7 +84,7 @@ def delayed_worker_assert(total_size, device_chunk_overhead, serialized_chunk_ov
     [
         {
             "device_memory_limit": int(200e6),
-            "memory_limit": int(800e6),
+            "memory_limit": int(2000e6),
             "host_target": False,
             "host_spill": False,
             "host_pause": False,
@@ -98,6 +98,16 @@ def delayed_worker_assert(total_size, device_chunk_overhead, serialized_chunk_ov
             "host_pause": False,
             "spills_to_disk": True,
         },
+        {
+            # This test setup differs from the one above as Distributed worker
+            # pausing is enabled and thus triggers `DeviceHostFile.evict()`
+            "device_memory_limit": int(200e6),
+            "memory_limit": int(1000e6),
+            "host_target": None,
+            "host_spill": None,
+            "host_pause": None,
+            "spills_to_disk": True,
+        },
         {
             "device_memory_limit": int(200e6),
             "memory_limit": None,
@@ -159,7 +169,7 @@ async def test_cupy_cluster_device_spill(params):
     [
         {
             "device_memory_limit": int(200e6),
-            "memory_limit": int(800e6),
+            "memory_limit": int(4000e6),
             "host_target": False,
             "host_spill": False,
             "host_pause": False,
@@ -173,6 +183,16 @@ async def test_cupy_cluster_device_spill(params):
             "host_pause": False,
             "spills_to_disk": True,
         },
+        {
+            # This test setup differs from the one above as Distributed worker
+            # pausing is enabled and thus triggers `DeviceHostFile.evict()`
+            "device_memory_limit": int(200e6),
+            "memory_limit": int(2000e6),
+            "host_target": None,
+            "host_spill": None,
+            "host_pause": None,
+            "spills_to_disk": True,
+        },
         {
             "device_memory_limit": int(200e6),
             "memory_limit": None,