Llama quantization. (#625)

2025-06-19 11:56:45 +00:00 · 2023-08-27 14:08:15 +01:00
parent 7151f2cf63
commit be471d50ab
2 changed files with 79 additions and 15 deletions
--- a/candle-core/src/quantized/mod.rs
+++ b/candle-core/src/quantized/mod.rs
@@ -202,6 +202,10 @@ impl QTensor {
        self.data.dtype()
    }

+    pub fn rank(&self) -> usize {
+        self.shape.rank()
+    }
+
    pub fn shape(&self) -> &Shape {
        &self.shape
    }