
Commit 617aac3

Add GPU memory guard to reproject dask+cupy path (#1131)

* Add sweep-performance design spec: parallel subagent triage + ralph-loop workflow for auditing all xrspatial modules for performance bottlenecks, OOM risk under 30 TB dask workloads, and backend-specific anti-patterns.
* Add sweep-performance implementation plan: 7 tasks covering command scaffold, module scoring, parallel subagent dispatch, report merging, ralph-loop generation, and smoke tests.
* Add sweep-performance slash command.
* Add GPU memory guard to reproject _reproject_dask_cupy (#1130).

1 parent e792422 commit 617aac3

1 file changed: xrspatial/reproject/__init__.py (13 additions, 0 deletions)
```diff
@@ -999,6 +999,19 @@ def _reproject_dask_cupy(
     src_res_x = (src_right - src_left) / src_w
     src_res_y = (src_top - src_bottom) / src_h

+    # Memory guard: the full output is allocated on GPU.
+    estimated = out_shape[0] * out_shape[1] * 8  # float64
+    try:
+        free_gpu, _total = cp.cuda.Device().mem_info
+        if estimated > 0.8 * free_gpu:
+            raise MemoryError(
+                f"_reproject_dask_cupy needs ~{estimated / 1e9:.1f} GB on GPU "
+                f"for the full output but only ~{free_gpu / 1e9:.1f} GB free. "
+                f"Reduce output resolution or use the dask+numpy path."
+            )
+    except (AttributeError, RuntimeError):
+        pass  # no device info available
+
     result = cp.full(out_shape, nodata, dtype=cp.float64)

     row_offset = 0
```
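The guard's sizing logic can be exercised without a GPU by factoring the comparison into a plain function. The sketch below is a hypothetical helper (`would_exceed_gpu_memory` is not part of xrspatial) that mirrors the committed check: estimate the float64 output footprint and flag it when it exceeds 80% of the free device memory, which the real code reads from `cp.cuda.Device().mem_info`.

```python
def would_exceed_gpu_memory(out_shape, free_gpu_bytes, headroom=0.8):
    """Mirror the commit's guard: return (exceeds, estimated_bytes) for a
    float64 output of shape out_shape against the given free GPU memory."""
    # float64 output: 8 bytes per element, full array allocated at once
    estimated = out_shape[0] * out_shape[1] * 8
    return estimated > headroom * free_gpu_bytes, estimated

# A 40000 x 40000 float64 raster needs ~12.8 GB, which exceeds 80% of an
# 8 GB budget; a 4000 x 4000 raster (~128 MB) fits comfortably.
big_exceeds, big_bytes = would_exceed_gpu_memory((40000, 40000), 8e9)
small_exceeds, small_bytes = would_exceed_gpu_memory((4000, 4000), 8e9)
```

Keeping the threshold below 100% leaves headroom for rasterio/warp scratch buffers and CuPy's memory pool fragmentation, which is presumably why the commit checks against `0.8 * free_gpu` rather than the full free amount.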
