Allow setting malloc heap size in string udfs #12094
```diff
@@ -3,6 +3,7 @@
 import os

 from cubinlinker.patch import _numba_version_ok, get_logger, new_patched_linker
+from cuda import cudart
 from numba import cuda
 from numba.cuda.cudadrv.driver import Linker
 from ptxcompiler.patch import NO_DRIVER, safe_get_versions

@@ -87,6 +88,26 @@ def _get_ptx_file():
     return regular_result[1]


+default_heap_size = int(2e6)
+
+heap_size = 0
+
+
+def set_malloc_heap_size(size=default_heap_size):
+    """
+    Heap size control for strings_udf, size in bytes.
+    """
+    global heap_size
+    if size == heap_size:
+        return
+    else:
+        (ret,) = cudart.cudaDeviceSetLimit(cudart.cudaLimit(2), size)
+        if ret.value != 0:
+            raise RuntimeError("Unable to set cudaMalloc heap size")
+        heap_size = size
+
+
 ptxpath = None
 versions = safe_get_versions()
 if versions != NO_DRIVER:
```

**Comment** (on `default_heap_size = int(2e6)`): I feel like this needs a big comment on why this is the default. This number seems a bit high considering 10M rows of 100 bytes each would only be 1GB. I suppose it makes sense since it is the largest strings column in bytes possible. Would it be too strange to make this configurable through an environment variable, perhaps?

**Reply:** I introduced an environment variable to control this. I'm still open to discussion here as to what to set the value as. Indeed, I did base it on the size of a strings column.
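For reference, the control flow of the new setter can be sketched in plain Python with the `cudart` call replaced by a recording stub (the stub and its call log are illustrative, not part of the PR; the real function calls `cudaDeviceSetLimit` with limit `2`, i.e. `cudaLimitMallocHeapSize`):

```python
calls = []  # records each (limit, size) pair the stub receives


def fake_cuda_device_set_limit(limit, size):
    # stand-in for cudart.cudaDeviceSetLimit; returns 0 for success
    calls.append((limit, size))
    return 0


default_heap_size = int(2e6)
heap_size = 0  # module-level cache of the last size we set


def set_malloc_heap_size(size=default_heap_size):
    """Heap size control for strings_udf, size in bytes."""
    global heap_size
    if size == heap_size:
        # already at the requested size: skip the driver call entirely
        return
    ret = fake_cuda_device_set_limit(2, size)  # 2 == cudaLimitMallocHeapSize
    if ret != 0:
        raise RuntimeError("Unable to set cudaMalloc heap size")
    heap_size = size


set_malloc_heap_size()           # first call reaches the "driver"
set_malloc_heap_size()           # same size: early return, no second call
set_malloc_heap_size(int(4e6))   # new size: driver called again
print(len(calls))  # 2
```

This makes the idempotency concrete: repeated calls with an unchanged size are free, which is what lets cudf call the setter eagerly before each UDF launch.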
**Comment:** The structure of this code makes it look like idempotency is its main goal, not laziness. `strings_udf.set_malloc_heap_size()` should only ever be called once, I think? Maybe this function or module in cudf (and not strings_udf) should own the "is it allocated already?" logic via a cache or global of some kind, and then the strings_udf logic doesn't need to read env vars for the allocation size, etc.

**Reply:** This is not an allocation. There is currently a malloc heap size by default (set to about 8MB on the GPUs I've tested on). This updates the heap size to a new value, so "already allocated" is not the goal.

**Comment:** Is `set_malloc_heap_size` intended to be a public API that can be called by a user, or is it an internal function? It's not entirely clear what the public API is here because this file doesn't define an `__all__`. If the function is just for internal use, why does it need to be called every time someone accesses a string column rather than just calling `cudaDeviceSetLimit` once when the package is imported (or after we can guarantee that the CUDA context etc. is initialized, if that is the requirement we're currently addressing by doing this "lazily")?

**Reply:** I think what we want to happen is: […] set `STRING_UDF_HEAP_SIZE` to something else during the session. Does this seem reasonable?
**Comment:** Seems we have 2 comment chains asking about the same thing: #12094 (comment)

**Reply:** Yes. The "set" function should not be called; avoid designs that try to set but exit early. No. The `STRING_UDF_HEAP_SIZE` should not be modifiable (I argued separately that that variable should not exist at all). If the user needs to be able to set a specific size, then the "set" function should be public and the user should be able to call it explicitly with immediate effect (not waiting until the next UDF execution, because memory demands can change in the meantime).

**Comment:** With the changes in af7cd9f I still have `heap_size` available as a module-level attribute of `strings_udf`. What do you think about checking if `heap_size == 0` within the getter to determine whether the function needs to be called or not?

**Reply:** You could use a cached function for this instead of a `global` that tracks whether the function has already been run, following ideas from https://mail.python.org/archives/list/[email protected]/thread/5OR3LJO7LOL6SC4OOGKFIVNNH4KADBPG/

**Reply:** Thanks, this worked perfectly!
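The cached-function idea can be sketched with `functools.cache`: memoization guarantees the body runs at most once per distinct argument, replacing the hand-rolled `global heap_size` check (the recording list is illustrative; the real body would call `cudaDeviceSetLimit`):

```python
from functools import cache

applied = []  # records every size whose body actually executed


@cache
def set_malloc_heap_size_once(size: int) -> None:
    # memoized: the body runs at most once per distinct size,
    # so repeated calls with the same size are no-ops
    applied.append(size)


set_malloc_heap_size_once(2_000_000)
set_malloc_heap_size_once(2_000_000)  # cached: body not re-run
set_malloc_heap_size_once(4_000_000)  # new size: body runs again
print(applied)  # [2000000, 4000000]
```

This gives the same idempotency as the `heap_size` global without any mutable module state, at the cost of keeping one cache entry per size ever requested.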