add quantized qwen2 (#2329)

* add quantized version of qwen2 and corresponding example for qwen2-instruct

* fix quantized qwen2 clippy error
This commit is contained in:
Zhuo Jinggang
2024-07-12 16:00:03 +08:00
committed by GitHub
parent a226a9736b
commit c63048d374
4 changed files with 641 additions and 0 deletions

View File

@@ -47,6 +47,7 @@ pub mod quantized_moondream;
pub mod quantized_mpt;
pub mod quantized_phi;
pub mod quantized_phi3;
pub mod quantized_qwen2;
pub mod quantized_recurrent_gemma;
pub mod quantized_rwkv_v5;
pub mod quantized_rwkv_v6;