Fix the quantized example. (#564)

This commit is contained in:
Laurent Mazare
2023-08-23 11:09:55 +01:00
committed by GitHub
parent 89a00b56cc
commit 0f4ff8a739

View File

@ -605,8 +605,8 @@ fn main() -> anyhow::Result<()> {
);
println!("params: {:?}", model.hparams);
let default_gqa = match args.which {
Which::L7b | Which::L13b => 1,
Which::L70b => 8,
Which::L7b | Which::L13b | Which::L7bChat | Which::L13bChat => 1,
Which::L70b | Which::L70bChat => 8,
};
ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))?
}