Expose some helper functions to create quantized models. (#1837)

2025-06-22 20:38:06 +00:00 · 2024-03-12 11:30:24 +01:00
parent df5f69444e
commit ff03fd3fb3
3 changed files with 15 additions and 0 deletions
--- a/candle-transformers/src/quantized_nn.rs
+++ b/candle-transformers/src/quantized_nn.rs
@@ -35,6 +35,14 @@ pub struct Linear {
 }

 impl Linear {
+    pub fn from_arc(
+        weight: std::sync::Arc<candle::quantized::QTensor>,
+        bias: Option<Tensor>,
+    ) -> Result<Self> {
+        let weight = QMatMul::from_weights(weight)?;
+        Ok(Self { weight, bias })
+    }
+
    pub fn from_weights(weight: QMatMul, bias: Option<Tensor>) -> Self {
        Self { weight, bias }
    }