mirror of
https://github.com/huggingface/candle.git
synced 2025-06-18 11:37:11 +00:00
Fix dequantization. (#1823)
This commit is contained in:
@ -398,7 +398,7 @@ impl QMatMul {
|
|||||||
_ => DEQUANTIZE_ALL.with(|b| *b),
|
_ => DEQUANTIZE_ALL.with(|b| *b),
|
||||||
};
|
};
|
||||||
let t = if dequantize {
|
let t = if dequantize {
|
||||||
let tensor = qtensor.dequantize(&Device::Cpu)?;
|
let tensor = qtensor.dequantize(&qtensor.device())?;
|
||||||
Self::Tensor(tensor)
|
Self::Tensor(tensor)
|
||||||
} else {
|
} else {
|
||||||
Self::QTensor(qtensor)
|
Self::QTensor(qtensor)
|
||||||
|
Reference in New Issue
Block a user