test(cuda.core): query all buffers before closing in test_batched_same_advice

rparolin · claude · rparolin · commit e0c782a547d4 · 2026-04-28T10:42:14.000-07:00
On CUDA 12, freeing one managed allocation appears to clear the
read-mostly advice on neighboring ranges. The original test interleaved
query-then-close inside one loop, so the second iteration would query
bufs[1] *after* bufs[0] had been freed and observe a cleared advice
flag — causing assert 0 == 1.

Move the queries into a list comprehension that runs before any close,
then close all buffers, then assert. Decouples the verification from
the deallocation order.

CUDA 13 was unaffected because its managed-memory bookkeeping does not
exhibit the cross-range invalidation on free.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/cuda_core/tests/test_memory.py b/cuda_core/tests/test_memory.py
@@ -2245,15 +2245,21 @@ def test_batched_same_advice(self, init_cuda):
         mr = DummyUnifiedMemoryResource(device)
         bufs = [mr.allocate(_MANAGED_TEST_ALLOCATION_SIZE) for _ in range(2)]
         advise(bufs, "set_read_mostly")
-        for buf in bufs:
-            assert (
-                _get_int_mem_range_attr(
-                    buf,
-                    driver.CUmem_range_attribute.CU_MEM_RANGE_ATTRIBUTE_READ_MOSTLY,
-                )
-                == _READ_MOSTLY_ENABLED
+        # Query all attributes BEFORE closing any buffer. On CUDA 12, freeing
+        # a managed allocation can clear read-mostly advice on neighboring
+        # ranges; interleaving query and close in one loop makes later
+        # iterations query after an earlier close and see the advice cleared.
+        results = [
+            _get_int_mem_range_attr(
+                buf,
+                driver.CUmem_range_attribute.CU_MEM_RANGE_ATTRIBUTE_READ_MOSTLY,
             )
+            for buf in bufs
+        ]
+        for buf in bufs:
             buf.close()
+        for r in results:
+            assert r == _READ_MOSTLY_ENABLED
 
     def test_batched_per_buffer_location(self, init_cuda):
         from cuda.core.utils import Location, advise