summaryrefslogtreecommitdiff
path: root/candle-core/src/dummy_metal_backend.rs
diff options
context:
space:
mode:
author Laurent Mazare <laurent.mazare@gmail.com> 2024-03-17 10:49:13 +0100
committer GitHub <noreply@github.com> 2024-03-17 10:49:13 +0100
commit ce9fbc368211815ef2dddff01575ca1f9d4eccd5 (patch)
tree e260edd957ab716d1789da05059c9a79696b0730 /candle-core/src/dummy_metal_backend.rs
parent db8b24ae92419377283821ee0a65fb224a4f3c4d (diff)
download candle-ce9fbc368211815ef2dddff01575ca1f9d4eccd5.tar.gz
candle-ce9fbc368211815ef2dddff01575ca1f9d4eccd5.tar.bz2
candle-ce9fbc368211815ef2dddff01575ca1f9d4eccd5.zip
Optimize the cat operation on contiguous tensors (#1855)
* Add a specialized kernel for copy2d.
* Move the cat operations.
* Avoid transpositions in cat.
* Bugfix.
* Bugfix for the cuda kernel.
* Add a benchmark.
* Add more testing.
* Test fix.
* Faster kernel.
* Add the missing kernel.
* Tweak the test.
* Add a metal kernel.
* Fix for the metal kernel.
* Get the tests to pass on metal.
* Also use this opportunity to fix the metal kernel for ELU.
* Add some bf16 kernels.
* Clippy fixes.
Diffstat (limited to 'candle-core/src/dummy_metal_backend.rs')
-rw-r--r-- candle-core/src/dummy_metal_backend.rs 13
1 files changed, 13 insertions, 0 deletions
diff --git a/candle-core/src/dummy_metal_backend.rs b/candle-core/src/dummy_metal_backend.rs
index e9d92331..791ec153 100644
--- a/candle-core/src/dummy_metal_backend.rs
+++ b/candle-core/src/dummy_metal_backend.rs
@@ -166,6 +166,19 @@ impl crate::backend::BackendStorage for MetalStorage {
Err(Error::NotCompiledWithMetalSupport)
}
+ fn copy2d(
+ &self,
+ _: &mut Self,
+ _: usize,
+ _: usize,
+ _: usize,
+ _: usize,
+ _: usize,
+ _: usize,
+ ) -> Result<()> {
+ Err(Error::NotCompiledWithMetalSupport)
+ }
+
fn avg_pool2d(&self, _: &Layout, _: (usize, usize), _: (usize, usize)) -> Result<Self> {
Err(Error::NotCompiledWithMetalSupport)
}