mirror of
https://github.com/huggingface/candle.git
synced 2025-06-15 18:28:24 +00:00
Improve the quantized whisper setup. (#1018)
* Improve the quantized whisper setup. * Fix the config file paths. * Use the standard matmul where possible.
This commit is contained in:
@ -867,7 +867,7 @@ impl PyQTensor {
|
||||
/// Performs a quantized matrix multiplication, with the quantized tensor as the right hand side.
|
||||
/// &RETURNS&: Tensor
|
||||
fn matmul_t(&self, lhs: &PyTensor) -> PyResult<PyTensor> {
|
||||
let qmatmul = ::candle::quantized::QMatMul::from_arc(self.0.clone());
|
||||
let qmatmul = ::candle::quantized::QMatMul::from_arc(self.0.clone()).map_err(wrap_err)?;
|
||||
let res = qmatmul.forward(lhs).map_err(wrap_err)?;
|
||||
Ok(PyTensor(res))
|
||||
}
|
||||
|
Reference in New Issue
Block a user