From 53fdbda683ea42947a51addffebbe369474159e8 Mon Sep 17 00:00:00 2001
From: laurent
Date: Mon, 26 Jun 2023 22:02:22 +0100
Subject: [PATCH] Add the f16 sum kernel (fix).

---
 kernels/src/reduce.cu | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/kernels/src/reduce.cu b/kernels/src/reduce.cu
index 76dbbdc3..e1ed57ab 100644
--- a/kernels/src/reduce.cu
+++ b/kernels/src/reduce.cu
@@ -44,7 +44,7 @@ extern "C" __global__ void FN_NAME( \
 } \
 
 #if __CUDA_ARCH__ >= 530
-SUM_OP(float, sum_f32)
+SUM_OP(__half, sum_f16)
 #endif
 
 SUM_OP(float, sum_f32)