summaryrefslogtreecommitdiff
path: root/candle-core/examples/cuda_sum_benchmark.rs
diff options
context:
space:
mode:
author: Laurent Mazare <laurent.mazare@gmail.com> 2023-08-13 13:53:34 +0200
committer: GitHub <noreply@github.com> 2023-08-13 12:53:34 +0100
commit: 9aca398a4fcd87aa095e933583190926359094bf (patch)
tree: 8b043e1f4d2d5377bceb6c939b7733c8aacc3df5 /candle-core/examples/cuda_sum_benchmark.rs
parent: 60cd1551ca29b2e3049f18ec8e60b6f165cfe941 (diff)
download: candle-9aca398a4fcd87aa095e933583190926359094bf.tar.gz
candle-9aca398a4fcd87aa095e933583190926359094bf.tar.bz2
candle-9aca398a4fcd87aa095e933583190926359094bf.zip
More accelerate optimizations (#427)
* Add more tracing to the whisper example.
* Support accelerate in more examples.
* Use accelerate for pointwise functions.
* Use accelerate for binary operations too.
* Bugfix for binary operation: use the rhs before the lhs.
Diffstat (limited to 'candle-core/examples/cuda_sum_benchmark.rs')
-rw-r--r-- candle-core/examples/cuda_sum_benchmark.rs 3
1 file changed, 3 insertions, 0 deletions
diff --git a/candle-core/examples/cuda_sum_benchmark.rs b/candle-core/examples/cuda_sum_benchmark.rs
index 1c8b0136..d6d182e8 100644
--- a/candle-core/examples/cuda_sum_benchmark.rs
+++ b/candle-core/examples/cuda_sum_benchmark.rs
@@ -1,6 +1,9 @@
#[cfg(feature = "mkl")]
extern crate intel_mkl_src;
+#[cfg(feature = "accelerate")]
+extern crate accelerate_src;
+
use std::str::FromStr;
use anyhow::Result;