{
DeviceInformation deviceInfo;
const DeviceContext deviceContext(deviceInfo);
+ const DeviceStream deviceStream(deviceInfo, deviceContext, DeviceStreamPriority::Normal, false);
const int numElements = h_rVecInput.size();
DeviceBuffer<RVec> d_rVecInput;
allocateDeviceBuffer(&d_rVecInput, numElements, deviceContext);
- copyToDeviceBuffer(&d_rVecInput, h_rVecInput.data(), 0, numElements, nullptr,
+ copyToDeviceBuffer(&d_rVecInput, h_rVecInput.data(), 0, numElements, deviceStream,
GpuApiCallBehavior::Sync, nullptr);
DeviceBuffer<float3> d_float3Output;
kernelLaunchConfig.blockSize[1] = 1;
kernelLaunchConfig.blockSize[2] = 1;
kernelLaunchConfig.sharedMemorySize = 0;
- kernelLaunchConfig.stream = nullptr;
+ kernelLaunchConfig.stream = deviceStream.stream();
auto kernelPtr = convertRVecToFloat3OnDevice_kernel;
const auto kernelArgs = prepareGpuKernelArguments(kernelPtr, kernelLaunchConfig,
&d_float3Output, &d_rVecInput, &numElements);
launchGpuKernel(kernelPtr, kernelLaunchConfig, nullptr, "convertRVecToFloat3OnDevice_kernel", kernelArgs);
- copyFromDeviceBuffer(h_float3Output.data(), &d_float3Output, 0, numElements, nullptr,
+ copyFromDeviceBuffer(h_float3Output.data(), &d_float3Output, 0, numElements, deviceStream,
GpuApiCallBehavior::Sync, nullptr);
saveFloat3InRVecFormat(h_rVecOutput, h_float3Output.data(), numElements);