mirror of
https://github.com/huggingface/candle.git
synced 2025-06-19 03:54:56 +00:00
Add back the bf16 flash-attn kernels. (#730)
This commit is contained in:
@ -146,6 +146,7 @@ impl candle::CustomOp3 for FlashAttn {
|
||||
/* seqlen_q_rounded */ seqlen_q_rounded as u32,
|
||||
/* seqlen_k_rounded */ seqlen_k_rounded as u32,
|
||||
/* is_causal */ causal,
|
||||
/* is_bf16 */ 0,
|
||||
)
|
||||
}
|
||||
|
||||
@ -354,6 +355,7 @@ impl candle::CustomOp3 for FlashAttnVarLen {
|
||||
/* seqlen_q_rounded */ seqlen_q_rounded as u32,
|
||||
/* seqlen_k_rounded */ seqlen_k_rounded as u32,
|
||||
/* is_causal */ causal,
|
||||
/* is_bf16 */ 0,
|
||||
)
|
||||
}
|
||||
|
||||
|
Reference in New Issue
Block a user