Improve the quantized whisper setup. (#1018)

* Improve the quantized whisper setup.
* Fix the config file paths.
* Use the standard matmul where possible.
2025-06-15 18:28:24 +00:00 · 2023-10-02 17:17:46 +01:00
parent e04c789230
commit 089fc3b584
8 changed files with 66 additions and 49 deletions
--- a/candle-pyo3/src/lib.rs
+++ b/candle-pyo3/src/lib.rs
@@ -867,7 +867,7 @@ impl PyQTensor {
    /// Performs a quantized matrix multiplication, with the quantized tensor as the right hand side.
    /// &RETURNS&: Tensor
    fn matmul_t(&self, lhs: &PyTensor) -> PyResult<PyTensor> {
-        let qmatmul = ::candle::quantized::QMatMul::from_arc(self.0.clone());
+        let qmatmul = ::candle::quantized::QMatMul::from_arc(self.0.clone()).map_err(wrap_err)?;
        let res = qmatmul.forward(lhs).map_err(wrap_err)?;
        Ok(PyTensor(res))
    }