mirror of
https://github.com/huggingface/candle.git
synced 2025-06-18 11:37:11 +00:00
Add an optimized case when performing the softmax over the last dimension. (#195)
This commit is contained in:
@@ -785,6 +785,19 @@ fn divide_by_sum_over_dim<T: WithDType>(s: &mut [T], shape: &Shape, dim: usize)
|
||||
let elem_per_slice = dims[dim];
|
||||
let prod_pre_dim = dims[..dim].iter().product();
|
||||
let prod_post_dim = dims[dim + 1..].iter().product();
|
||||
if prod_post_dim == 1 {
|
||||
for pre_idx in 0..prod_pre_dim {
|
||||
let mut sum = 0f64;
|
||||
let idx = pre_idx * elem_per_slice;
|
||||
for v in s[idx..idx + elem_per_slice].iter() {
|
||||
sum += v.to_f64();
|
||||
}
|
||||
let sum = T::from_f64(sum);
|
||||
for v in s[idx..idx + elem_per_slice].iter_mut() {
|
||||
*v /= sum
|
||||
}
|
||||
}
|
||||
} else {
|
||||
for pre_idx in 0..prod_pre_dim {
|
||||
for post_idx in 0..prod_post_dim {
|
||||
let mut sum = 0f64;
|
||||
@@ -801,6 +814,7 @@ fn divide_by_sum_over_dim<T: WithDType>(s: &mut [T], shape: &Shape, dim: usize)
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
Ok(())
|
||||
}
|
||||
|
||||
|
Reference in New Issue
Block a user