diff --git a/candle-transformers/src/models/quantized_t5.rs b/candle-transformers/src/models/quantized_t5.rs index 7f7d53dd..5f08c67d 100644 --- a/candle-transformers/src/models/quantized_t5.rs +++ b/candle-transformers/src/models/quantized_t5.rs @@ -775,8 +775,6 @@ impl T5ForConditionalGeneration { Some(ref lm_head) => lm_head.forward(&sequence_output)?, } }; - - // TODO: Rescale output before projecting on vocab? * (self.model_dim**-0.5) Ok(output) } diff --git a/candle-transformers/src/models/t5.rs b/candle-transformers/src/models/t5.rs index c5d5724a..84704ca9 100644 --- a/candle-transformers/src/models/t5.rs +++ b/candle-transformers/src/models/t5.rs @@ -779,8 +779,6 @@ impl T5ForConditionalGeneration { Some(ref lm_head) => lm_head.forward(&sequence_output)?, } }; - - // TODO: Rescale output before projecting on vocab? * (self.model_dim**-0.5) Ok(output) }