mirror of
https://github.com/huggingface/candle.git
synced 2025-06-16 10:38:54 +00:00
Streaming mode for reporting the generated tokens (#1007)
* Token streaming.
* Use the token output stream.
* Flush the output.
* Ensure that the last characters get reported.
This commit is contained in:
@@ -25,6 +25,7 @@ rayon = { workspace = true }
|
||||
safetensors = { workspace = true }
|
||||
serde = { workspace = true }
|
||||
serde_json = { workspace = true }
|
||||
tokenizers = { workspace = true, features = ["onig"] }
|
||||
|
||||
[dev-dependencies]
|
||||
anyhow = { workspace = true }
|
||||
@@ -35,7 +36,6 @@ imageproc = { workspace = true }
|
||||
memmap2 = { workspace = true }
|
||||
rand = { workspace = true }
|
||||
rusttype = { workspace = true }
|
||||
tokenizers = { workspace = true, features = ["onig"] }
|
||||
tracing = { workspace = true }
|
||||
tracing-chrome = { workspace = true }
|
||||
tracing-subscriber = { workspace = true }
|
||||
|
Reference in New Issue
Block a user