mirror of
https://github.com/huggingface/candle.git
synced 2025-06-16 18:48:51 +00:00
Fix the quantized mistral example. (#1478)
This commit is contained in:
@ -41,7 +41,7 @@ impl VersionedMagic {
|
|||||||
(Magic::Gguf, 1) => Self::GgufV1,
|
(Magic::Gguf, 1) => Self::GgufV1,
|
||||||
(Magic::Gguf, 2) => Self::GgufV2,
|
(Magic::Gguf, 2) => Self::GgufV2,
|
||||||
(Magic::Gguf, 3) => Self::GgufV3,
|
(Magic::Gguf, 3) => Self::GgufV3,
|
||||||
_ => crate::bail!("ggml: unsupported magic/version {magic:?}/{version}"),
|
_ => crate::bail!("gguf: unsupported magic/version {magic:?}/{version}"),
|
||||||
};
|
};
|
||||||
Ok(versioned_magic)
|
Ok(versioned_magic)
|
||||||
}
|
}
|
||||||
|
@ -155,8 +155,8 @@ struct Args {
|
|||||||
#[arg(long, short = 'n', default_value_t = 100)]
|
#[arg(long, short = 'n', default_value_t = 100)]
|
||||||
sample_len: usize,
|
sample_len: usize,
|
||||||
|
|
||||||
#[arg(long, default_value = "mistralai/Mistral-7B-v0.1")]
|
#[arg(long)]
|
||||||
model_id: String,
|
model_id: Option<String>,
|
||||||
|
|
||||||
#[arg(long, default_value = "main")]
|
#[arg(long, default_value = "main")]
|
||||||
revision: String,
|
revision: String,
|
||||||
@ -207,8 +207,18 @@ fn main() -> Result<()> {
|
|||||||
|
|
||||||
let start = std::time::Instant::now();
|
let start = std::time::Instant::now();
|
||||||
let api = Api::new()?;
|
let api = Api::new()?;
|
||||||
|
let model_id = match args.model_id {
|
||||||
|
Some(model_id) => model_id,
|
||||||
|
None => {
|
||||||
|
if args.quantized {
|
||||||
|
"lmz/candle-mistral".to_string()
|
||||||
|
} else {
|
||||||
|
"mistralai/Mistral-7B-v0.1".to_string()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
};
|
||||||
let repo = api.repo(Repo::with_revision(
|
let repo = api.repo(Repo::with_revision(
|
||||||
args.model_id,
|
model_id,
|
||||||
RepoType::Model,
|
RepoType::Model,
|
||||||
args.revision,
|
args.revision,
|
||||||
));
|
));
|
||||||
|
Reference in New Issue
Block a user