summary | refs | log | tree | commit | diff
path: root/candle-core/src/quantized/k_quants.rs
diff options
context:
space:
mode:
author: Laurent Mazare <laurent.mazare@gmail.com> 2023-10-03 12:10:58 +0100
committer: GitHub <noreply@github.com> 2023-10-03 12:10:58 +0100
commit: dac73edb3468565fe9817166675db6e422a49767 (patch)
tree: c88994a7cbe4939eda213f44a22773c2df702a33 /candle-core/src/quantized/k_quants.rs
parent: b4da19d1be0241883b55f1a8cbdaeea21f95c3ca (diff)
download: candle-dac73edb3468565fe9817166675db6e422a49767.tar.gz
candle-dac73edb3468565fe9817166675db6e422a49767.tar.bz2
candle-dac73edb3468565fe9817166675db6e422a49767.zip
AVX optimized q8k vecdot. (#1024)
Diffstat (limited to 'candle-core/src/quantized/k_quants.rs')
-rw-r--r-- candle-core/src/quantized/k_quants.rs 3
1 files changed, 3 insertions, 0 deletions
diff --git a/candle-core/src/quantized/k_quants.rs b/candle-core/src/quantized/k_quants.rs
index 80d36555..7567c446 100644
--- a/candle-core/src/quantized/k_quants.rs
+++ b/candle-core/src/quantized/k_quants.rs
@@ -1758,6 +1758,9 @@ impl GgmlType for BlockQ8K {
#[allow(unreachable_code)]
fn vec_dot(n: usize, xs: &[Self], ys: &[Self::VecDotType]) -> Result<f32> {
+ #[cfg(target_feature = "avx")]
+ return super::avx::vec_dot_q8k_q8k(n, xs, ys);
+
#[cfg(target_feature = "neon")]
return super::neon::vec_dot_q8k_q8k(n, xs, ys);