mirror of
https://github.com/huggingface/candle.git
synced 2025-06-17 02:58:50 +00:00

* module docs * varbuilder gguf docs * add a link to gguf files * small additional mod doc titles * safetensor docs * more core docs * more module docs in candle_core * 2 more link fixes
153 lines
4.6 KiB
Rust
153 lines
4.6 KiB
Rust
//! Traits to Define Backend Behavior
//!
|
|
use crate::op::{BinaryOpT, CmpOp, ReduceOp, UnaryOpT};
|
|
use crate::{CpuStorage, DType, Layout, Result, Shape};
|
|
|
|
pub trait BackendStorage: Sized {
|
|
type Device: BackendDevice;
|
|
|
|
fn try_clone(&self, _: &Layout) -> Result<Self>;
|
|
|
|
fn dtype(&self) -> DType;
|
|
|
|
fn device(&self) -> &Self::Device;
|
|
|
|
// Maybe this should return a Cow instead so that no copy is done on the cpu case.
|
|
fn to_cpu_storage(&self) -> Result<CpuStorage>;
|
|
|
|
fn affine(&self, _: &Layout, _: f64, _: f64) -> Result<Self>;
|
|
|
|
fn powf(&self, _: &Layout, _: f64) -> Result<Self>;
|
|
|
|
fn elu(&self, _: &Layout, _: f64) -> Result<Self>;
|
|
|
|
fn reduce_op(&self, _: ReduceOp, _: &Layout, _: &[usize]) -> Result<Self>;
|
|
|
|
fn cmp(&self, _: CmpOp, _: &Self, _: &Layout, _: &Layout) -> Result<Self>;
|
|
|
|
fn to_dtype(&self, _: &Layout, _: DType) -> Result<Self>;
|
|
|
|
fn unary_impl<B: UnaryOpT>(&self, _: &Layout) -> Result<Self>;
|
|
|
|
fn binary_impl<B: BinaryOpT>(&self, _: &Self, _: &Layout, _: &Layout) -> Result<Self>;
|
|
|
|
fn where_cond(&self, _: &Layout, _: &Self, _: &Layout, _: &Self, _: &Layout) -> Result<Self>;
|
|
|
|
fn conv1d(
|
|
&self,
|
|
_l: &Layout,
|
|
_kernel: &Self,
|
|
_kernel_l: &Layout,
|
|
_params: &crate::conv::ParamsConv1D,
|
|
) -> Result<Self>;
|
|
|
|
fn conv_transpose1d(
|
|
&self,
|
|
_l: &Layout,
|
|
_kernel: &Self,
|
|
_kernel_l: &Layout,
|
|
_params: &crate::conv::ParamsConvTranspose1D,
|
|
) -> Result<Self>;
|
|
|
|
fn conv2d(
|
|
&self,
|
|
_l: &Layout,
|
|
_kernel: &Self,
|
|
_kernel_l: &Layout,
|
|
_params: &crate::conv::ParamsConv2D,
|
|
) -> Result<Self>;
|
|
|
|
fn conv_transpose2d(
|
|
&self,
|
|
_l: &Layout,
|
|
_kernel: &Self,
|
|
_kernel_l: &Layout,
|
|
_params: &crate::conv::ParamsConvTranspose2D,
|
|
) -> Result<Self>;
|
|
|
|
fn avg_pool2d(&self, _: &Layout, _: (usize, usize), _: (usize, usize)) -> Result<Self>;
|
|
fn max_pool2d(&self, _: &Layout, _: (usize, usize), _: (usize, usize)) -> Result<Self>;
|
|
fn upsample_nearest1d(&self, _: &Layout, _: usize) -> Result<Self>;
|
|
fn upsample_nearest2d(&self, _: &Layout, _: usize, _: usize) -> Result<Self>;
|
|
|
|
fn gather(&self, _: &Layout, _: &Self, _: &Layout, _: usize) -> Result<Self>;
|
|
fn scatter_add(
|
|
&self,
|
|
_: &Layout,
|
|
_: &Self,
|
|
_: &Layout,
|
|
_: &Self,
|
|
_: &Layout,
|
|
_: usize,
|
|
) -> Result<Self>;
|
|
fn index_select(&self, _: &Self, _: &Layout, _: &Layout, _: usize) -> Result<Self>;
|
|
fn index_add(
|
|
&self,
|
|
_: &Layout,
|
|
_: &Self,
|
|
_: &Layout,
|
|
_: &Self,
|
|
_: &Layout,
|
|
_: usize,
|
|
) -> Result<Self>;
|
|
|
|
fn matmul(
|
|
&self,
|
|
_: &Self,
|
|
_: (usize, usize, usize, usize),
|
|
_: &Layout,
|
|
_: &Layout,
|
|
) -> Result<Self>;
|
|
|
|
fn copy_strided_src(&self, _: &mut Self, _: usize, _: &Layout) -> Result<()>;
|
|
|
|
#[allow(clippy::too_many_arguments)]
|
|
// Similar to cudaMemcpy2D, though values are in elements and not in bytes.
|
|
fn copy2d(
|
|
&self,
|
|
_: &mut Self,
|
|
_d1: usize,
|
|
_d2: usize,
|
|
_src_stride1: usize,
|
|
_dst_stride1: usize,
|
|
_src_offset: usize,
|
|
_dst_offset: usize,
|
|
) -> Result<()>;
|
|
}
|
|
|
|
pub trait BackendDevice: Sized + std::fmt::Debug + Clone {
|
|
type Storage: BackendStorage;
|
|
|
|
// TODO: Make the usize generic and part of a generic DeviceLocation.
|
|
fn new(_: usize) -> Result<Self>;
|
|
|
|
fn location(&self) -> crate::DeviceLocation;
|
|
|
|
fn same_device(&self, _: &Self) -> bool;
|
|
|
|
fn zeros_impl(&self, _shape: &Shape, _dtype: DType) -> Result<Self::Storage>;
|
|
|
|
fn ones_impl(&self, _shape: &Shape, _dtype: DType) -> Result<Self::Storage>;
|
|
|
|
/// # Safety
|
|
/// This function is unsafe as it doesn't initialize the underlying data store.
|
|
/// The caller should ensure that the data is properly initialized as early as possible
|
|
/// after this call.
|
|
unsafe fn alloc_uninit(&self, _shape: &Shape, _dtype: DType) -> Result<Self::Storage>;
|
|
|
|
fn storage_from_slice<T: crate::WithDType>(&self, _: &[T]) -> Result<Self::Storage>;
|
|
|
|
fn storage_from_cpu_storage(&self, _: &CpuStorage) -> Result<Self::Storage>;
|
|
|
|
fn storage_from_cpu_storage_owned(&self, _: CpuStorage) -> Result<Self::Storage>;
|
|
|
|
fn rand_uniform(&self, _: &Shape, _: DType, _: f64, _: f64) -> Result<Self::Storage>;
|
|
|
|
fn rand_normal(&self, _: &Shape, _: DType, _: f64, _: f64) -> Result<Self::Storage>;
|
|
|
|
fn set_seed(&self, _: u64) -> Result<()>;
|
|
|
|
/// Synchronize should block until all the operations on the device are completed.
|
|
fn synchronize(&self) -> Result<()>;
|
|
}
|