More model cloning. (#1126)

* More model cloning.
* More cloning on quantized models.
2025-06-18 19:47:12 +00:00 · 2023-10-18 21:55:46 +01:00
parent 185b54a33b
commit 902d0b9166
4 changed files with 19 additions and 19 deletions
--- a/candle-transformers/src/models/quantized_mpt.rs
+++ b/candle-transformers/src/models/quantized_mpt.rs
@@ -7,7 +7,7 @@ use candle_nn::LayerNorm;

 pub use super::mpt::Config;

-#[derive(Debug)]
+#[derive(Debug, Clone)]
 struct GroupedQueryAttention {
    wqkv: Linear,
    out_proj: Linear,
@@ -101,7 +101,7 @@ impl GroupedQueryAttention {
    }
 }

-#[derive(Debug)]
+#[derive(Debug, Clone)]
 struct Ffn {
    up_proj: Linear,
    down_proj: Linear,
@@ -122,7 +122,7 @@ impl Module for Ffn {
    }
 }

-#[derive(Debug)]
+#[derive(Debug, Clone)]
 struct MPTBlock {
    norm1: LayerNorm, // Do we need the low-precision variant?
    attn: GroupedQueryAttention,
@@ -155,7 +155,7 @@ impl MPTBlock {
    }
 }

-#[derive(Debug)]
+#[derive(Debug, Clone)]
 pub struct Model {
    wte: Embedding,
    blocks: Vec<MPTBlock>,