mirror of
https://github.com/huggingface/candle.git
synced 2025-06-16 10:38:54 +00:00
Add quantized tensors. (#458)
* Add quantized tensors. * Implement the debug trait for QTensor. * Add the QMatMul custom op.
This commit is contained in:
@ -3,7 +3,6 @@ use clap::Parser;
|
||||
use std::fs::File;
|
||||
|
||||
use candle::quantized::ggml_file::Content;
|
||||
use candle::{DType, Device};
|
||||
|
||||
#[derive(Parser, Debug)]
|
||||
#[command(author, version, about, long_about = None)]
|
||||
@ -18,7 +17,7 @@ fn main() -> Result<()> {
|
||||
|
||||
let mut file = File::open(args.model)?;
|
||||
let start = std::time::Instant::now();
|
||||
let model = Content::read(&mut file, DType::F16, &Device::Cpu)?;
|
||||
let model = Content::read(&mut file)?;
|
||||
|
||||
println!(
|
||||
"Loaded {:?} tensors in {:?}",
|
||||
|
Reference in New Issue
Block a user