import numpy as np
import cupy as cp
from adios2 import FileReader
import adios2.bindings as adios2

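# The example assumes a CUDA-capable device visible to CuPy and an ADIOS2
# build configured with GPU (CUDA) support; a minimal sketch of a guard for
# the device side (getDeviceCount is a CUDA runtime query exposed by CuPy):
#   if cp.cuda.runtime.getDeviceCount() == 0:
#       raise RuntimeError("no CUDA device available")
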
def write_array(fileName, nSteps, gpuArray, cpuArray):
    adios = adios2.ADIOS()
    ioWriter = adios.DeclareIO("cupyWriter")
    # define the ADIOS2 variables; cpuArray supplies the dtype
    # (float32 in this case) for both variables
    gpuVar = ioWriter.DefineVariable("gpuArray", cpuArray, gpuArray.shape,
                                     [0] * len(gpuArray.shape), gpuArray.shape)
    # setting the memory space to GPU tells ADIOS2 that the buffers
    # passed for this variable live in device memory
    gpuVar.SetMemorySpace(adios2.MemorySpace.GPU)
    cpuVar = ioWriter.DefineVariable("cpuArray", cpuArray, cpuArray.shape,
                                     [0] * len(cpuArray.shape), cpuArray.shape)

    # write both the CPU and the GPU array for each simulation step
    wStream = ioWriter.Open(fileName, adios2.Mode.Write)
    for step in range(nSteps):
        # write buffers
        wStream.BeginStep()
        wStream.Put(cpuVar, cpuArray)
        # the GPU variable receives the raw device pointer
        wStream.Put(gpuVar, gpuArray.data.ptr)
        wStream.EndStep()
        # update the buffers between steps
        gpuArray = gpuArray * 2
        cpuArray = cpuArray + 1
    wStream.Close()
    print("Write to file %s: %s data from GPU and %s data from CPU" % (
        fileName, gpuArray.shape, cpuArray.shape))

def read_array(fileName, nSteps):
    adios = adios2.ADIOS()
    ioReader = adios.DeclareIO("cupyReader")
    rStream = ioReader.Open(fileName, adios2.Mode.Read)
    for step in range(nSteps):
        rStream.BeginStep()
        # prepare the input buffers
        gpuVar = ioReader.InquireVariable("gpuArray")
        cpuVar = ioReader.InquireVariable("cpuArray")
        cpuBuffer = np.zeros(cpuVar.Shape(), dtype=np.float32)
        # query the shape for the GPU memory space and allocate the
        # receiving buffer on the device with CuPy
        gpuShape = gpuVar.Shape(adios2.MemorySpace.GPU)
        gpuBuffer = cp.zeros(gpuShape, dtype=np.float32)
        gpuVar.SetSelection([(0, 0), gpuShape])
        # populate the buffers; the GPU variable receives the raw device pointer
        rStream.Get(gpuVar, gpuBuffer.data.ptr)
        rStream.Get(cpuVar, cpuBuffer)
        rStream.EndStep()
        print("Step %d: read GPU data\n %s" % (step, gpuBuffer))
        print("Step %d: read CPU data\n %s" % (step, cpuBuffer))
    rStream.Close()


if __name__ == '__main__':
    # define the simulation data on the host
    cpuArray = np.array([[0, 1.0, 2.0], [3.0, 4.0, 5.0]], dtype=np.float32)
    # copy the data to the device
    gpuArray = cp.asarray(cpuArray)
    print("Array allocation: ", gpuArray.device)

    mempool = cp.get_default_memory_pool()
    pinned_mempool = cp.get_default_pinned_memory_pool()
    print("Bytes required to store the gpu array", gpuArray.nbytes)
    print("Bytes allocated on the device memory pool", mempool.total_bytes())
    print("Bytes used on the device memory pool", mempool.used_bytes())
    print("Blocks allocated on the pinned memory pool (the allocated pinned"
          " memory is released once the transfer completes)",
          pinned_mempool.n_free_blocks())

    nSteps = 2
    write_array("StepsWriteReadCuPy.bp", nSteps, gpuArray, cpuArray)
    read_array("StepsWriteReadCuPy.bp", nSteps)
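
    # Optional verification pass, a minimal sketch using the high-level
    # FileReader API imported above (assumes an ADIOS2 version whose
    # Stream.read accepts a step_selection argument, e.g. 2.10+); both
    # variables are read back into host (numpy) arrays for the last step
    with FileReader("StepsWriteReadCuPy.bp") as reader:
        lastGpu = reader.read("gpuArray", step_selection=[nSteps - 1, 1])
        lastCpu = reader.read("cpuArray", step_selection=[nSteps - 1, 1])
        print("Last step on file: gpu %s cpu %s" % (lastGpu, lastCpu))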