Add the quantize command. (#624)

* Add the quantize command.
* Bugfix for writing gguf files.
* And add a comment.
2025-06-19 19:58:35 +00:00 · 2023-08-27 11:35:19 +01:00
parent 6e485f2deb
commit 7151f2cf63
2 changed files with 77 additions and 2 deletions
--- a/candle-core/src/quantized/gguf_file.rs
+++ b/candle-core/src/quantized/gguf_file.rs
@@ -292,7 +292,7 @@ impl ValueType {
            7 => Self::Bool,
            8 => Self::String,
            9 => Self::Array,
-            v => crate::bail!("unrecognized value-type {v}"),
+            v => crate::bail!("unrecognized value-type {v:#08x}"),
        };
        Ok(v)
    }
@@ -393,6 +393,7 @@ pub fn write<W: std::io::Seek + std::io::Write>(
    w.write_u32::<LittleEndian>(0x46554747)?;
    w.write_u32::<LittleEndian>(1)?; // version 1.
    w.write_u32::<LittleEndian>(tensors.len() as u32)?;
+    w.write_u32::<LittleEndian>(metadata.len() as u32)?;
    for (name, value) in metadata.iter() {
        write_string(w, name)?;
        w.write_u32::<LittleEndian>(value.value_type().to_u32())?;