mirror of
https://github.com/huggingface/candle.git
synced 2025-06-17 11:08:52 +00:00
Compare commits
1 Commit
0.7.2
...
llama-v3-m
Author | SHA1 | Date | |
---|---|---|---|
6d6d87f8b3 |
@@ -120,7 +120,10 @@ fn main() -> Result<()> {
|
|||||||
Some("bf16") => DType::BF16,
|
Some("bf16") => DType::BF16,
|
||||||
Some("f32") => DType::F32,
|
Some("f32") => DType::F32,
|
||||||
Some(dtype) => bail!("Unsupported dtype {dtype}"),
|
Some(dtype) => bail!("Unsupported dtype {dtype}"),
|
||||||
None => DType::F16,
|
None => match args.which {
|
||||||
|
Which::V3 | Which::V3Instruct => DType::BF16,
|
||||||
|
Which::V1 | Which::V2 | Which::Solar10_7B | Which::TinyLlama1_1BChat => DType::F16,
|
||||||
|
},
|
||||||
};
|
};
|
||||||
let (llama, tokenizer_filename, mut cache, config) = {
|
let (llama, tokenizer_filename, mut cache, config) = {
|
||||||
let api = Api::new()?;
|
let api = Api::new()?;
|
||||||
|
Reference in New Issue
Block a user