mirror of
https://github.com/huggingface/candle.git
synced 2025-06-19 11:56:45 +00:00
Removing the fences speeds everything up and *is* correct this time...
This commit is contained in:
@@ -250,7 +250,7 @@ fn main() -> Result<()> {
|
||||
let vb =
|
||||
candle_transformers::quantized_var_builder::VarBuilder::from_gguf(filename, &device)?;
|
||||
let model = QMistral::new(&config, vb)?;
|
||||
- (Model::Quantized(model), Device::Cpu)
|
||||
+ (Model::Quantized(model), device)
|
||||
} else {
|
||||
let dtype = if device.is_cuda() {
|
||||
DType::BF16
|
||||
|
Reference in New Issue
Block a user