mirror of
https://github.com/huggingface/candle.git
synced 2025-06-16 10:38:54 +00:00
Fix the quantized example. (#564)
This commit is contained in:
@@ -605,8 +605,8 @@ fn main() -> anyhow::Result<()> {
|
||||
);
|
||||
println!("params: {:?}", model.hparams);
|
||||
let default_gqa = match args.which {
|
||||
-Which::L7b | Which::L13b => 1,
|
||||
-Which::L70b => 8,
|
||||
+Which::L7b | Which::L13b | Which::L7bChat | Which::L13bChat => 1,
|
||||
+Which::L70b | Which::L70bChat => 8,
|
||||
};
|
||||
ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))?
|
||||
}
|
||||
|
Reference in New Issue
Block a user