From 0f4ff8a739facafd4b3bc9a003d4a581202b62f8 Mon Sep 17 00:00:00 2001
From: Laurent Mazare
Date: Wed, 23 Aug 2023 11:09:55 +0100
Subject: [PATCH] Fix the quantized example. (#564)

---
 candle-examples/examples/quantized/main.rs | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/candle-examples/examples/quantized/main.rs b/candle-examples/examples/quantized/main.rs
index c4be8974..dfe81632 100644
--- a/candle-examples/examples/quantized/main.rs
+++ b/candle-examples/examples/quantized/main.rs
@@ -605,8 +605,8 @@ fn main() -> anyhow::Result<()> {
             );
             println!("params: {:?}", model.hparams);
             let default_gqa = match args.which {
-                Which::L7b | Which::L13b => 1,
-                Which::L70b => 8,
+                Which::L7b | Which::L13b | Which::L7bChat | Which::L13bChat => 1,
+                Which::L70b | Which::L70bChat => 8,
             };
             ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))?
         }