We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent bc4ea53 commit d883ac3 Copy full SHA for d883ac3
1 file changed
src/hydrogen/device/rocBLAS_API.cpp
@@ -75,6 +75,10 @@ class ResultMgr
75
H_CHECK_HIP(hipFreeAsync(device_, stream));
76
#endif // HYDROGEN_HAVE_CUB
77
78
+ // Sync stream to match cuBLAS behavior (cuBLAS docs here:
79
+ // https://docs.nvidia.com/cuda/cublas/#scalar-parameters)
80
+ H_CHECK_HIP(hipStreamSynchronize(stream));
81
+
82
// Reset pointer mode
83
H_CHECK_ROCBLAS(rocblas_set_pointer_mode(handle_, rocblas_pointer_mode_host));
84
}
0 commit comments