Llama quantization. (#625)

This commit is contained in:
Laurent Mazare
2023-08-27 14:08:15 +01:00
committed by GitHub
parent 7151f2cf63
commit be471d50ab
2 changed files with 79 additions and 15 deletions

View File

@ -202,6 +202,10 @@ impl QTensor {
self.data.dtype()
}
/// Returns the rank reported by this tensor's stored shape.
///
/// This simply forwards to the `rank` method of the `shape` field
/// (presumably the number of dimensions — confirm against `Shape::rank`).
pub fn rank(&self) -> usize {
    let shape = &self.shape;
    shape.rank()
}
pub fn shape(&self) -> &Shape {
&self.shape
}