Affine Metal kernel works. Need to extract buffer contents based on layout offset (like CudaSlice.slice) for candle integration

This commit is contained in:
Ivar Flakstad
2023-11-06 04:46:53 +01:00
parent 6d4c8c0707
commit 8124d1003f
4 changed files with 188 additions and 8 deletions

View File

@@ -190,7 +190,7 @@ impl candle::CustomOp1 for SoftmaxLastDim {
device: dev.clone(),
};
Ok((dst, layout.shape().clone()))
}
}
#[cfg(feature = "metal")]
fn metal_fwd(