Skip to content

Commit bd9f5fa

Browse files
authored
Change the cuda_wait flag from CUDA_WAIT_ALL to CUDA_WAIT_READ in sgemmBatch and dgemmBatch
1 parent 245afd1 commit bd9f5fa

1 file changed

Lines changed: 2 additions & 4 deletions

File tree

src/gpuarray_blas_cuda_cublas.c

Lines changed: 2 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -835,8 +835,7 @@ static int sgemmBatch(cb_order order, cb_transpose transA, cb_transpose transB,
835 835
return ctx->err->code;
836 836
}
837 837

838-
// added cuda_wait
839-
GA_CUDA_EXIT_ON_ERROR(ctx, cuda_wait(Ta, CUDA_WAIT_ALL));
838+
GA_CUDA_EXIT_ON_ERROR(ctx, cuda_wait(Ta, CUDA_WAIT_READ));
840 839

841 840
err = cublasSgemmBatched(h->h,
842 841
convT(transA), convT(transB),
@@ -965,8 +964,7 @@ static int dgemmBatch(cb_order order, cb_transpose transA, cb_transpose transB,
965 964
return ctx->err->code;
966 965
}
967 966

968-
// added cuda_wait
969-
GA_CUDA_EXIT_ON_ERROR(ctx, cuda_wait(Ta, CUDA_WAIT_ALL));
967+
GA_CUDA_EXIT_ON_ERROR(ctx, cuda_wait(Ta, CUDA_WAIT_READ));
970 968

971 969
err = cublasDgemmBatched(h->h,
972 970
convT(transA), convT(transB),

0 commit comments

Comments
 (0)