Add the bf16 CUDA kernels.

This commit is contained in:
laurent
2023-06-29 23:12:02 +01:00
parent 018e017e7e
commit ec79fc43f2
9 changed files with 67 additions and 1 deletions

View File

@@ -1,4 +1,5 @@
#include "cuda_fp16.h"
#include "cuda_bf16.h"
// Table showing which features are supported on which compute capability
// https://docs.nvidia.com/cuda/cuda-c-programming-guide/#features-and-technical-specifications