Fix softmax for long sequences (missing barrier).

This commit is contained in:
Nicolas Patry
2023-12-14 19:37:03 +01:00
parent f419a38e1a
commit 4eeaf205d6
3 changed files with 50 additions and 18 deletions

View File

@@ -126,7 +126,7 @@ impl MetalDevice {
}
let new_buffer = self.device.new_buffer(size as NSUInteger, option);
let new_buffer = Arc::new(new_buffer);
- // subbuffers.push(new_buffer.clone());
+ subbuffers.push(new_buffer.clone());
// println!("Created tensor {size} {name}");
for subbuffers in buffers.values_mut() {
let newbuffers = subbuffers