Segment-anything fixes: avoid normalizing twice. (#767)

* Segment-anything fixes: avoid normalizing twice.
* More fixes for the image aspect ratio.
2025-06-18 03:28:50 +00:00 · 2023-09-07 21:45:16 +01:00
parent 7396b8ed1a
commit 79c27fc489
3 changed files with 33 additions and 3 deletions
--- a/candle-examples/examples/segment-anything/model_sam.rs
+++ b/candle-examples/examples/segment-anything/model_sam.rs
@@ -6,7 +6,7 @@ use crate::model_mask_decoder::MaskDecoder;
 use crate::model_prompt_encoder::PromptEncoder;

 const PROMPT_EMBED_DIM: usize = 256;
-const IMAGE_SIZE: usize = 1024;
+pub const IMAGE_SIZE: usize = 1024;
 const VIT_PATCH_SIZE: usize = 16;

 #[derive(Debug)]
@@ -90,6 +90,7 @@ impl Sam {
    fn preprocess(&self, img: &Tensor) -> Result<Tensor> {
        let (c, h, w) = img.dims3()?;
        let img = img
+            .to_dtype(DType::F32)?
            .broadcast_sub(&self.pixel_mean)?
            .broadcast_div(&self.pixel_std)?;
        if h > IMAGE_SIZE || w > IMAGE_SIZE {