Fix for the batch dim in the quantized matmul example. (#2073)

* Fix for the batch dim in the quantized matmul example.
* Enable more tests on cuda.
* Add a test for qmm with a batch.
* Fix the zeros-dim test on metal.
2025-06-19 11:56:45 +00:00 · 2024-04-15 20:00:28 +02:00
parent af955f260c
commit f135b7963d
3 changed files with 38 additions and 38 deletions
--- a/candle-core/src/metal_backend/device.rs
+++ b/candle-core/src/metal_backend/device.rs
@@ -283,5 +283,5 @@ impl MetalDevice {
 }

 fn buf_size(size: NSUInteger) -> NSUInteger {
-    (size - 1).next_power_of_two() as NSUInteger
+    size.saturating_sub(1).next_power_of_two() as NSUInteger
 }
--- a/candle-core/src/quantized/cuda.rs
+++ b/candle-core/src/quantized/cuda.rs
@@ -464,7 +464,7 @@ impl QCudaStorage {
                /* x_rows */ n,
                /* x_cols */ k,
                /* y_rows */ k,
-                /* y_cols */ m,
+                /* y_cols */ b * m,
                self.device(),
            )?
        };