Tensor -> QTensor conversion (#496)

* Sketch some qmatmul tests.
* Add the quantization function.
* More testing.
* Make the test smaller and faster.
* Add some shape checking.
2025-06-16 10:38:54 +00:00 · 2023-08-18 08:19:20 +01:00
parent 26fd37b348
commit a22b1bed7b
4 changed files with 87 additions and 7 deletions
--- a/candle-core/examples/cpu_benchmarks.rs
+++ b/candle-core/examples/cpu_benchmarks.rs
@@ -90,7 +90,7 @@ impl Benchmark for QMatMul {
    type RunResult = Tensor;
    fn preprocess() -> Result<Self::PreProcessData> {
        let zeros = vec![candle_core::quantized::k_quants::BlockQ4_0::zeros(); 4096 * 11008 / 32];
-        let mm = candle_core::quantized::QTensor::new(zeros, (4096, 11008));
+        let mm = candle_core::quantized::QTensor::new(zeros, (4096, 11008))?;
        let mm = candle_core::quantized::QMatMul::from_qtensor(mm);
        let arg = Tensor::randn(0f32, 1., (128, 11008), &Device::Cpu)?;
        Ok((mm, arg))