Fix the quantized mistral example. (#1478)

This commit is contained in:
Laurent Mazare
2023-12-25 09:31:24 +01:00
committed by GitHub
parent 88589d8815
commit 7135791dd5
2 changed files with 14 additions and 4 deletions

View File

@@ -41,7 +41,7 @@ impl VersionedMagic {
(Magic::Gguf, 1) => Self::GgufV1, (Magic::Gguf, 1) => Self::GgufV1,
(Magic::Gguf, 2) => Self::GgufV2, (Magic::Gguf, 2) => Self::GgufV2,
(Magic::Gguf, 3) => Self::GgufV3, (Magic::Gguf, 3) => Self::GgufV3,
_ => crate::bail!("ggml: unsupported magic/version {magic:?}/{version}"), _ => crate::bail!("gguf: unsupported magic/version {magic:?}/{version}"),
}; };
Ok(versioned_magic) Ok(versioned_magic)
} }

View File

@@ -155,8 +155,8 @@ struct Args {
#[arg(long, short = 'n', default_value_t = 100)] #[arg(long, short = 'n', default_value_t = 100)]
sample_len: usize, sample_len: usize,
#[arg(long, default_value = "mistralai/Mistral-7B-v0.1")] #[arg(long)]
model_id: String, model_id: Option<String>,
#[arg(long, default_value = "main")] #[arg(long, default_value = "main")]
revision: String, revision: String,
@@ -207,8 +207,18 @@ fn main() -> Result<()> {
let start = std::time::Instant::now(); let start = std::time::Instant::now();
let api = Api::new()?; let api = Api::new()?;
let model_id = match args.model_id {
Some(model_id) => model_id,
None => {
if args.quantized {
"lmz/candle-mistral".to_string()
} else {
"mistralai/Mistral-7B-v0.1".to_string()
}
}
};
let repo = api.repo(Repo::with_revision( let repo = api.repo(Repo::with_revision(
args.model_id, model_id,
RepoType::Model, RepoType::Model,
args.revision, args.revision,
)); ));