Fix dequantization. (#1823)

This commit is contained in:
Laurent Mazare
2024-03-08 23:12:13 +01:00
committed by GitHub
parent 3440cec3a0
commit 936f6a4840

View File

@@ -398,7 +398,7 @@ impl QMatMul {
_ => DEQUANTIZE_ALL.with(|b| *b),
};
let t = if dequantize {
- let tensor = qtensor.dequantize(&Device::Cpu)?;
+ let tensor = qtensor.dequantize(&qtensor.device())?;
Self::Tensor(tensor)
} else {
Self::QTensor(qtensor)