Skip to content

Commit 8adcc9e

Browse files
committed
fix determinism
1 parent: 550ff94 · commit: 8adcc9e

1 file changed

Lines changed: 1 addition & 1 deletion

File tree

pufferlib/src/kernels.cu

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@ typedef __nv_bfloat16 precision_t;
26 26
constexpr bool USE_BF16 = true;
27 27
constexpr int PRECISION_SIZE = 2;
28 28
static constexpr cudaDataType_t CUBLAS_PRECISION = CUDA_R_16BF;
29-
static constexpr cublasComputeType_t CUBLAS_COMPUTE_PRECISION = CUBLAS_COMPUTE_32F_FAST_16BF;
29+
static constexpr cublasComputeType_t CUBLAS_COMPUTE_PRECISION = CUBLAS_COMPUTE_32F; // Note: fast bf16 is not deterministic
30 30
#define NCCL_PRECISION ncclBfloat16
31 31
#define to_float(x) __bfloat162float(x)
32 32
#define from_float(x) __float2bfloat16(x)

0 commit comments

Comments
 (0)