//! Traits to Define Backend Behavior //! use crate::op::{BinaryOpT, CmpOp, ReduceOp, UnaryOpT}; use crate::{CpuStorage, DType, Layout, Result, Shape}; pub trait BackendStorage: Sized { type Device: BackendDevice; fn try_clone(&self, _: &Layout) -> Result; fn dtype(&self) -> DType; fn device(&self) -> &Self::Device; // Maybe this should return a Cow instead so that no copy is done on the cpu case. fn to_cpu_storage(&self) -> Result; fn affine(&self, _: &Layout, _: f64, _: f64) -> Result; fn powf(&self, _: &Layout, _: f64) -> Result; fn elu(&self, _: &Layout, _: f64) -> Result; fn reduce_op(&self, _: ReduceOp, _: &Layout, _: &[usize]) -> Result; fn cmp(&self, _: CmpOp, _: &Self, _: &Layout, _: &Layout) -> Result; fn to_dtype(&self, _: &Layout, _: DType) -> Result; fn unary_impl(&self, _: &Layout) -> Result; fn binary_impl(&self, _: &Self, _: &Layout, _: &Layout) -> Result; fn where_cond(&self, _: &Layout, _: &Self, _: &Layout, _: &Self, _: &Layout) -> Result; fn conv1d( &self, _l: &Layout, _kernel: &Self, _kernel_l: &Layout, _params: &crate::conv::ParamsConv1D, ) -> Result; fn conv_transpose1d( &self, _l: &Layout, _kernel: &Self, _kernel_l: &Layout, _params: &crate::conv::ParamsConvTranspose1D, ) -> Result; fn conv2d( &self, _l: &Layout, _kernel: &Self, _kernel_l: &Layout, _params: &crate::conv::ParamsConv2D, ) -> Result; fn conv_transpose2d( &self, _l: &Layout, _kernel: &Self, _kernel_l: &Layout, _params: &crate::conv::ParamsConvTranspose2D, ) -> Result; fn avg_pool2d(&self, _: &Layout, _: (usize, usize), _: (usize, usize)) -> Result; fn max_pool2d(&self, _: &Layout, _: (usize, usize), _: (usize, usize)) -> Result; fn upsample_nearest1d(&self, _: &Layout, _: usize) -> Result; fn upsample_nearest2d(&self, _: &Layout, _: usize, _: usize) -> Result; fn gather(&self, _: &Layout, _: &Self, _: &Layout, _: usize) -> Result; fn scatter_add( &self, _: &Layout, _: &Self, _: &Layout, _: &Self, _: &Layout, _: usize, ) -> Result; fn index_select(&self, _: &Self, _: &Layout, _: &Layout, _: usize) -> Result; fn index_add( &self, _: &Layout, _: &Self, _: &Layout, _: &Self, _: &Layout, _: usize, ) -> Result; fn matmul( &self, _: &Self, _: (usize, usize, usize, usize), _: &Layout, _: &Layout, ) -> Result; fn copy_strided_src(&self, _: &mut Self, _: usize, _: &Layout) -> Result<()>; #[allow(clippy::too_many_arguments)] // Similar to cudaMemcpy2D, though values are in elements and not in bytes. fn copy2d( &self, _: &mut Self, _d1: usize, _d2: usize, _src_stride1: usize, _dst_stride1: usize, _src_offset: usize, _dst_offset: usize, ) -> Result<()>; } pub trait BackendDevice: Sized + std::fmt::Debug + Clone { type Storage: BackendStorage; // TODO: Make the usize generic and part of a generic DeviceLocation. fn new(_: usize) -> Result; fn location(&self) -> crate::DeviceLocation; fn same_device(&self, _: &Self) -> bool; fn zeros_impl(&self, _shape: &Shape, _dtype: DType) -> Result; fn ones_impl(&self, _shape: &Shape, _dtype: DType) -> Result; /// # Safety /// This function is unsafe as it doesn't initialize the underlying data store. /// The caller should ensure that the data is properly initialized as early as possible /// after this call. unsafe fn alloc_uninit(&self, _shape: &Shape, _dtype: DType) -> Result; fn storage_from_slice(&self, _: &[T]) -> Result; fn storage_from_cpu_storage(&self, _: &CpuStorage) -> Result; fn storage_from_cpu_storage_owned(&self, _: CpuStorage) -> Result; fn rand_uniform(&self, _: &Shape, _: DType, _: f64, _: f64) -> Result; fn rand_normal(&self, _: &Shape, _: DType, _: f64, _: f64) -> Result; fn set_seed(&self, _: u64) -> Result<()>; /// Synchronize should block until all the operations on the device are completed. fn synchronize(&self) -> Result<()>; }