Add the f16 sum kernel.

This commit is contained in:
laurent
2023-06-26 22:01:29 +01:00
parent d204f1c7c0
commit 93e24f29f4

View File

@@ -43,6 +43,10 @@ extern "C" __global__ void FN_NAME( \
} \
} \
// Instantiate the SUM_OP kernel template once per supported element type.
// Each invocation emits one extern "C" kernel, so every FN_NAME must be unique.

// Half-precision variant: only built when __CUDA_ARCH__ >= 530.
// NOTE(review): `__half` is declared in <cuda_fp16.h>; confirm that this file
// (or a header it already includes) pulls it in, and that every operation used
// inside SUM_OP is available for `__half` on the targeted architectures.
#if __CUDA_ARCH__ >= 530
SUM_OP(__half, sum_f16)
#endif

SUM_OP(float, sum_f32)
SUM_OP(double, sum_f64)
SUM_OP(uint32_t, sum_u32)