diff --git a/candle-examples/examples/quantized/main.rs b/candle-examples/examples/quantized/main.rs index c4be8974..dfe81632 100644 --- a/candle-examples/examples/quantized/main.rs +++ b/candle-examples/examples/quantized/main.rs @@ -605,8 +605,8 @@ fn main() -> anyhow::Result<()> { ); println!("params: {:?}", model.hparams); let default_gqa = match args.which { - Which::L7b | Which::L13b => 1, - Which::L70b => 8, + Which::L7b | Which::L13b | Which::L7bChat | Which::L13bChat => 1, + Which::L70b | Which::L70bChat => 8, }; ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))? }