mirror of
https://github.com/huggingface/candle.git
synced 2025-06-17 19:18:50 +00:00
@ -19,7 +19,7 @@ byteorder = "1.4.3"
|
|||||||
clap = { version = "4.2.4", features = ["derive"] }
|
clap = { version = "4.2.4", features = ["derive"] }
|
||||||
# Re-enable this once 0.9.13 has been released, as it will include the cublas-f16 changes
|
# Re-enable this once 0.9.13 has been released, as it will include the cublas-f16 changes
|
||||||
# cudarc = { version = "0.9.13", optional = true, features = ["f16"] }
|
# cudarc = { version = "0.9.13", optional = true, features = ["f16"] }
|
||||||
cudarc = { git = "https://github.com/coreylowman/cudarc.git", features = ["f16", "nccl"] }
|
cudarc = { git = "https://github.com/coreylowman/cudarc.git", features = ["f16"] }
|
||||||
# TODO: Switch back to the official gemm implementation once the following are available.
|
# TODO: Switch back to the official gemm implementation once the following are available.
|
||||||
# https://github.com/sarah-ek/gemm/pull/8.
|
# https://github.com/sarah-ek/gemm/pull/8.
|
||||||
# https://github.com/sarah-ek/gemm/pull/9.
|
# https://github.com/sarah-ek/gemm/pull/9.
|
||||||
|
@ -42,7 +42,7 @@ default = []
|
|||||||
cuda = ["candle/cuda", "candle-nn/cuda", "candle-transformers/cuda"]
|
cuda = ["candle/cuda", "candle-nn/cuda", "candle-transformers/cuda"]
|
||||||
flash-attn = ["cuda", "dep:candle-flash-attn"]
|
flash-attn = ["cuda", "dep:candle-flash-attn"]
|
||||||
mkl = ["dep:intel-mkl-src", "candle/mkl", "candle-nn/mkl", "candle-transformers/mkl"]
|
mkl = ["dep:intel-mkl-src", "candle/mkl", "candle-nn/mkl", "candle-transformers/mkl"]
|
||||||
nccl = ["dep:cudarc", "dep:half"]
|
nccl = ["cuda", "cudarc/nccl", "dep:half"]
|
||||||
|
|
||||||
[[example]]
|
[[example]]
|
||||||
name = "llama_multiprocess"
|
name = "llama_multiprocess"
|
||||||
|
Reference in New Issue
Block a user