mirror of
https://github.com/huggingface/candle.git
synced 2025-06-17 11:08:52 +00:00
Fix the quantized example. (#564)
This commit is contained in:
@ -605,8 +605,8 @@ fn main() -> anyhow::Result<()> {
|
|||||||
);
|
);
|
||||||
println!("params: {:?}", model.hparams);
|
println!("params: {:?}", model.hparams);
|
||||||
let default_gqa = match args.which {
|
let default_gqa = match args.which {
|
||||||
Which::L7b | Which::L13b => 1,
|
Which::L7b | Which::L13b | Which::L7bChat | Which::L13bChat => 1,
|
||||||
Which::L70b => 8,
|
Which::L70b | Which::L70bChat => 8,
|
||||||
};
|
};
|
||||||
ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))?
|
ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))?
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user