Use cudarc 0.16. (#2900)

* Use cudarc 0.16.

* Allow for disabling event tracking.

* Tweaks.

* Bump the ug version.

* And bump the candle version too.
This commit is contained in:
Laurent Mazare
2025-04-15 21:40:18 +02:00
committed by GitHub
parent b01ebbad8a
commit e4e7b0b2da
7 changed files with 44 additions and 20 deletions

View File

@@ -1,6 +1,6 @@
[package]
name = "candle-flash-attn"
-version = "0.9.0-alpha.3"
+version = "0.9.0-alpha.4"
edition = "2021"
description = "Flash attention layer for the candle ML framework."
@@ -11,7 +11,7 @@ license = "MIT OR Apache-2.0"
readme = "README.md"
[dependencies]
-candle = { path = "../candle-core", features = ["cuda"], package = "candle-core", version = "0.9.0-alpha.3" }
+candle = { path = "../candle-core", features = ["cuda"], package = "candle-core", version = "0.9.0-alpha.4" }
half = { version = "2.3.1", features = ["num-traits"] }
[build-dependencies]