Fix dequantization. (#1823)

2025-06-18 11:37:11 +00:00 · 2024-03-08 23:12:13 +01:00
parent 3440cec3a0
commit 936f6a4840
1 changed file with 1 addition and 1 deletion
--- a/candle-core/src/quantized/mod.rs
+++ b/candle-core/src/quantized/mod.rs
@@ -398,7 +398,7 @@ impl QMatMul {
            _ => DEQUANTIZE_ALL.with(|b| *b),
        };
        let t = if dequantize {
-            let tensor = qtensor.dequantize(&Device::Cpu)?;
+            let tensor = qtensor.dequantize(&qtensor.device())?;
            Self::Tensor(tensor)
        } else {
            Self::QTensor(qtensor)