Mirror of https://github.com/huggingface/candle.git (synced 2025-06-16 18:48:51 +00:00)
Fix mistral attention on Metal (#2699)
Co-authored-by: Luka Zakrajsek <luka.zakrajsek@soniox.com>
This commit is contained in:
@@ -262,7 +262,8 @@ impl Attention {
             .contiguous()?;
         let value_states = value_states
             .reshape((b_sz, q_len, self.num_kv_heads, self.head_dim))?
-            .transpose(1, 2)?;
+            .transpose(1, 2)?
+            .contiguous()?;
 
         let (query_states, key_states) =
             self.rotary_emb
Reference in New Issue
Block a user