Quantized version of the metavoice model. (#1824)

* Quantized version of the metavoice model.
* Integrate the quantized version of metavoice.
2025-06-22 20:38:06 +00:00 · 2024-03-09 11:06:04 +01:00
parent 936f6a4840
commit dd00482ea3
5 changed files with 277 additions and 12 deletions
--- a/candle-transformers/src/quantized_nn.rs
+++ b/candle-transformers/src/quantized_nn.rs
@@ -50,6 +50,16 @@ impl Module for Linear {
    }
 }

+/// Builds a quantized `Linear` from `vb`. When `bias` is true the "bias" tensor (length
+/// `out_dim`) is fetched and dequantized on `vb.device()`; otherwise no bias is attached.
+pub fn linear_b(in_dim: usize, out_dim: usize, bias: bool, vb: VarBuilder) -> Result<Linear> {
+    let bias = bias
+        .then(|| vb.get(out_dim, "bias")?.dequantize(vb.device()))
+        .transpose()?;
+    let weight = QMatMul::new(in_dim, out_dim, vb)?;
+    Ok(Linear { weight, bias })
+}
+
 pub fn linear(in_dim: usize, out_dim: usize, vb: VarBuilder) -> Result<Linear> {
    let bias = vb.get(out_dim, "bias")?.dequantize(vb.device())?;
    let weight = QMatMul::new(in_dim, out_dim, vb)?;