mirror of
https://github.com/huggingface/candle.git
synced 2025-06-20 20:09:50 +00:00
Add the bf16 cuda kernels.
This commit is contained in:
@@ -32,6 +32,10 @@ extern "C" __global__ void FN_NAME( \
|
||||
} \
|
||||
} \
|
||||
|
||||
#if __CUDA_ARCH__ >= 800
|
||||
WHERE_OP(__nv_bfloat16, where_bf16)
|
||||
#endif
|
||||
|
||||
#if __CUDA_ARCH__ >= 530
|
||||
WHERE_OP(__half, where_f16)
|
||||
#endif
|
||||
|
Reference in New Issue
Block a user