Avoid the race condition in CUDA sums.

2025-06-17 02:58:50 +00:00 · 2023-06-26 16:19:06 +01:00
parent 687c5beb6a
commit f2ac5547fc
3 changed files with 15 additions and 3 deletions
--- a/examples/cuda_basics.rs
+++ b/examples/cuda_basics.rs
@@ -3,6 +3,11 @@ use candle::{Device, Tensor};

 fn main() -> Result<()> {
    let device = Device::new_cuda(0)?;
+    let x = Tensor::new(&[[11f32, 22.], [33., 44.], [55., 66.], [77., 78.]], &device)?;
+    println!("> {:?}", x.sum(&[0])?.to_vec2::<f32>()?);
+    println!("> {:?}", x.sum(&[1])?.to_vec2::<f32>()?);
+    println!("> {:?}", x.sum(&[0, 1])?.to_vec2::<f32>()?);
+
    let x = Tensor::new(&[3f32, 1., 4., 1., 5.], &device)?;
    println!("{:?}", x.to_vec1::<f32>()?);
    let y = Tensor::new(&[2f32, 7., 1., 8., 2.], &device)?;