Mirror of https://github.com/huggingface/candle.git (last synced 2025-06-16 02:38:10 +00:00).
Release the mmdit model earlier to reduce memory usage. (#2581)
* Stable diffusion 3.5 support.
* Clippy fixes.
* CFG fix.
* Remove some unnecessary clones.
* Avoid duplicating some of the code.
* Release the mmdit model earlier to reduce memory usage.
This commit is contained in:
@@ -183,17 +183,17 @@ fn main() -> Result<()> {
|
||||
let context = Tensor::cat(&[context, context_uncond], 0)?;
|
||||
let y = Tensor::cat(&[y, y_uncond], 0)?;
|
||||
|
||||
if let Some(seed) = seed {
|
||||
device.set_seed(seed)?;
|
||||
}
|
||||
let start_time = std::time::Instant::now();
|
||||
let x = {
|
||||
let mmdit = MMDiT::new(
|
||||
&mmdit_config,
|
||||
use_flash_attn,
|
||||
vb.pp("model.diffusion_model"),
|
||||
)?;
|
||||
|
||||
if let Some(seed) = seed {
|
||||
device.set_seed(seed)?;
|
||||
}
|
||||
let start_time = std::time::Instant::now();
|
||||
let x = sampling::euler_sample(
|
||||
sampling::euler_sample(
|
||||
&mmdit,
|
||||
&y,
|
||||
&context,
|
||||
@@ -202,7 +202,8 @@ fn main() -> Result<()> {
|
||||
time_shift,
|
||||
height,
|
||||
width,
|
||||
)?;
|
||||
)?
|
||||
};
|
||||
let dt = start_time.elapsed().as_secs_f32();
|
||||
println!(
|
||||
"Sampling done. {num_inference_steps} steps. {:.2}s. Average rate: {:.2} iter/s",
|
||||
|
Reference in New Issue
Block a user