Skip to content

Commit a18251f

Browse files
author
abergeron
authored
Merge pull request #528 from dendisuhubdy/patch-cuda-race-condition
CUDA race conditions
2 parents ae79a3c + bd9f5fa commit a18251f

1 file changed

Lines changed: 4 additions & 0 deletions

File tree

src/gpuarray_blas_cuda_cublas.c

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -835,6 +835,8 @@ static int sgemmBatch(cb_order order, cb_transpose transA, cb_transpose transB,
835 835
return ctx->err->code;
836 836
}
837 837

838+
GA_CUDA_EXIT_ON_ERROR(ctx, cuda_wait(Ta, CUDA_WAIT_READ));
839+
838 840
err = cublasSgemmBatched(h->h,
839 841
convT(transA), convT(transB),
840 842
M, N, K, &alpha,
@@ -962,6 +964,8 @@ static int dgemmBatch(cb_order order, cb_transpose transA, cb_transpose transB,
962 964
return ctx->err->code;
963 965
}
964 966

967+
GA_CUDA_EXIT_ON_ERROR(ctx, cuda_wait(Ta, CUDA_WAIT_READ));
968+
965 969
err = cublasDgemmBatched(h->h,
966 970
convT(transA), convT(transB),
967 971
M, N, K, &alpha,

0 commit comments

Comments
 (0)