Add a quantized version of recurrent-gemma. (#2054)

* Add a quantized version of recurrent-gemma.

* Share the rglru part.

* Get the quantized gemma model to work.
This commit is contained in:
Laurent Mazare
2024-04-13 20:07:01 +02:00
committed by GitHub
parent 4c88c3ce06
commit 50e49ecc5f
6 changed files with 521 additions and 67 deletions

View File

@@ -63,7 +63,7 @@ impl VarBuilder {
let path = self.path(name);
match self.data.get(&path) {
None => {
-candle::bail!("cannot find tensor {name}")
+candle::bail!("cannot find tensor {path}")
}
Some(qtensor) => {
let shape = s.into();