Add a couple cuda kernels from dfdx.

2025-06-20 04:00:28 +00:00 · 2023-06-22 12:56:29 +01:00
parent 625e08d6ab
commit 4b1c3405e9
9 changed files with 501 additions and 0 deletions
--- a/kernels/src/binary_mul.cu
+++ b/kernels/src/binary_mul.cu
@@ -0,0 +1,21 @@
+#include "binary_op_macros.cuh"
+
+struct BinaryMulKernalOp {}; // Empty struct; passed as the fifth argument to every BINARY_OP invocation in this file.
+
+#if __CUDA_ARCH__ >= 530 // __half variant is only emitted when targeting compute capability 5.3+ (an undefined __CUDA_ARCH__ evaluates as 0 here, so the block is skipped)
+BINARY_OP(__half, bmul_fwd_f16, bmul_bwd_lhs_f16, bmul_bwd_rhs_f16, BinaryMulKernalOp, // element type, three generated names (fwd / bwd_lhs / bwd_rhs), op struct
+    x * y, // 1st expression: the product itself; presumably used by bmul_fwd_f16 -- confirm against BINARY_OP in binary_op_macros.cuh
+    y, // 2nd expression: d(x*y)/dx; presumably used by bmul_bwd_lhs_f16 -- confirm against BINARY_OP
+    x) // 3rd expression: d(x*y)/dy; presumably used by bmul_bwd_rhs_f16 -- confirm against BINARY_OP
+#endif // __CUDA_ARCH__ >= 530
+
+BINARY_OP(float, bmul_fwd_f32, bmul_bwd_lhs_f32, bmul_bwd_rhs_f32, BinaryMulKernalOp, // float instantiation: element type, three generated names, op struct
+    x * y, // 1st expression: the product itself; presumably used by bmul_fwd_f32 -- confirm against BINARY_OP in binary_op_macros.cuh
+    y, // 2nd expression: d(x*y)/dx; presumably used by bmul_bwd_lhs_f32 -- confirm against BINARY_OP
+    x) // 3rd expression: d(x*y)/dy; presumably used by bmul_bwd_rhs_f32 -- confirm against BINARY_OP
+
+BINARY_OP(double, bmul_fwd_f64, bmul_bwd_lhs_f64, bmul_bwd_rhs_f64, BinaryMulKernalOp, // double instantiation: element type, three generated names, op struct
+    x * y, // 1st expression: the product itself; presumably used by bmul_fwd_f64 -- confirm against BINARY_OP in binary_op_macros.cuh
+    y, // 2nd expression: d(x*y)/dx; presumably used by bmul_bwd_lhs_f64 -- confirm against BINARY_OP
+    x) // 3rd expression: d(x*y)/dy; presumably used by bmul_bwd_rhs_f64 -- confirm against BINARY_OP
+