F16 support for stable diffusion (#488)

* F16 support for stable diffusion.

* Keep the attention bits in F32.

* Keep more of the attention bits in F32.

* More mixed precision support.
This commit is contained in:
Laurent Mazare
2023-08-17 13:48:56 +01:00
committed by GitHub
parent c3176f0dfb
commit 5d99026fd2
6 changed files with 99 additions and 43 deletions

View File

@@ -159,10 +159,11 @@ impl StableDiffusionConfig {
         &self,
         vae_weights: P,
         device: &Device,
+        dtype: DType,
     ) -> Result<vae::AutoEncoderKL> {
         let weights = unsafe { candle::safetensors::MmapedFile::new(vae_weights)? };
         let weights = weights.deserialize()?;
-        let vs_ae = nn::VarBuilder::from_safetensors(vec![weights], DType::F32, device);
+        let vs_ae = nn::VarBuilder::from_safetensors(vec![weights], dtype, device);
         // https://huggingface.co/runwayml/stable-diffusion-v1-5/blob/main/vae/config.json
         let autoencoder = vae::AutoEncoderKL::new(vs_ae, 3, 3, self.autoencoder.clone())?;
         Ok(autoencoder)
@@ -174,10 +175,11 @@ impl StableDiffusionConfig {
         device: &Device,
         in_channels: usize,
         use_flash_attn: bool,
+        dtype: DType,
     ) -> Result<unet_2d::UNet2DConditionModel> {
         let weights = unsafe { candle::safetensors::MmapedFile::new(unet_weights)? };
         let weights = weights.deserialize()?;
-        let vs_unet = nn::VarBuilder::from_safetensors(vec![weights], DType::F32, device);
+        let vs_unet = nn::VarBuilder::from_safetensors(vec![weights], dtype, device);
         let unet = unet_2d::UNet2DConditionModel::new(
             vs_unet,
             in_channels,
@@ -196,10 +198,11 @@ impl StableDiffusionConfig {
         &self,
         clip_weights: P,
         device: &Device,
+        dtype: DType,
     ) -> Result<clip::ClipTextTransformer> {
         let weights = unsafe { candle::safetensors::MmapedFile::new(clip_weights)? };
         let weights = weights.deserialize()?;
-        let vs = nn::VarBuilder::from_safetensors(vec![weights], DType::F32, device);
+        let vs = nn::VarBuilder::from_safetensors(vec![weights], dtype, device);
         let text_model = clip::ClipTextTransformer::new(vs, &self.clip)?;
         Ok(text_model)
     }