Single-Thread + Single-Stream
import acl

# ......

# Explicitly create a stream. The call returns the stream handle together
# with a status code; per the pyACL API reference, 0 means success.
stream, ret = acl.rt.create_stream()
if ret != 0:
    raise RuntimeError(f"acl.rt.create_stream failed, ret={ret}")

try:
    # Pass the stream argument to the task triggering call. The copy is only
    # queued on the stream here; it is not guaranteed to be complete on return.
    ret = acl.rt.memcpy_async(devPtr, devSize, hostPtr, hostSize,
                              ACL_MEMCPY_HOST_TO_DEVICE, stream)
    if ret != 0:
        raise RuntimeError(f"acl.rt.memcpy_async failed, ret={ret}")

    # Call acl.rt.synchronize_stream to block the application until all tasks
    # in the specified stream are complete.
    ret = acl.rt.synchronize_stream(stream)
    if ret != 0:
        raise RuntimeError(f"acl.rt.synchronize_stream failed, ret={ret}")
finally:
    # Explicitly destroy the stream after using the stream. This runs on the
    # failure path as well so the stream is not leaked; its status code is
    # deliberately not raised so it cannot mask an error from the steps above.
    acl.rt.destroy_stream(stream)

# ......