Fix dequantization. (#1823)

This commit is contained in:
Laurent Mazare
2024-03-08 23:12:13 +01:00
committed by GitHub
parent 3440cec3a0
commit 936f6a4840

View File

@@ -398,7 +398,7 @@ impl QMatMul {
_ => DEQUANTIZE_ALL.with(|b| *b), _ => DEQUANTIZE_ALL.with(|b| *b),
}; };
let t = if dequantize { let t = if dequantize {
let tensor = qtensor.dequantize(&Device::Cpu)?; let tensor = qtensor.dequantize(&qtensor.device())?;
Self::Tensor(tensor) Self::Tensor(tensor)
} else { } else {
Self::QTensor(qtensor) Self::QTensor(qtensor)