mirror of
https://github.com/huggingface/candle.git
synced 2025-06-18 03:28:50 +00:00
Ignore rotary.
This commit is contained in:
@ -199,7 +199,10 @@ impl MHA {
|
||||
Some((prev_k, _)) => prev_k.dim(1)?,
|
||||
};
|
||||
// In the Python implementation, a single tensor is returned with the third axis of size 3.
|
||||
let (q, k, v) = self.rotary_emb.apply_rotary_emb_qkv(&qkv, seqlen_offset)?;
|
||||
// let (q, k, v) = self.rotary_emb.apply_rotary_emb_qkv(&qkv, seqlen_offset)?;
|
||||
let q = qkv.i((.., .., 0))?;
|
||||
let k = qkv.i((.., .., 1))?;
|
||||
let v = qkv.i((.., .., 2))?;
|
||||
let (k, v) = match &self.kv_cache {
|
||||
None => (k, v),
|
||||
Some((prev_k, prev_v)) => {
|
||||
|
Reference in New Issue
Block a user