Simplify the KvCache api. (#2207)

This commit is contained in:
Laurent Mazare
2024-05-23 17:07:21 +02:00
committed by GitHub
parent 31cf64147b
commit 45e235a747
3 changed files with 54 additions and 44 deletions

View File

@@ -217,7 +217,6 @@ fn main() -> anyhow::Result<()> {
match args.which {
Which::Phi2 => Model::Phi2(Phi2::from_gguf(model, &mut file, &device)?),
Which::Phi3 => Model::Phi3(Phi3::from_gguf(
1,
args.use_flash_attn,
model,
&mut file,