mirror of
https://github.com/huggingface/candle.git
synced 2025-06-16 10:38:54 +00:00
Llama bugfix.
This commit is contained in:
@@ -300,7 +300,7 @@ impl CausalSelfAttention {
|
||||
let att = att.softmax(att.rank() - 1)?;
|
||||
// Convert to contiguous as matmul doesn't support strided vs for now.
|
||||
let y = att.matmul(&v.contiguous()?)?;
|
||||
- let y = y.transpose(1, 2)?.reshape(&[t, c])?;
|
||||
+ let y = y.transpose(0, 1)?.reshape(&[t, c])?;
|
||||
let y = self.c_proj.forward(&y)?;
|
||||
Ok(y)
|
||||
}
|
||||
|
Reference in New Issue
Block a user