summary | refs | log | tree | commit | diff
path: root/candle-core/src/quantized/k_quants.rs
diff options
context:
space:
mode:
author: Laurent Mazare <laurent.mazare@gmail.com> 2023-08-29 09:41:17 +0100
committer: GitHub <noreply@github.com> 2023-08-29 09:41:17 +0100
commit: 4b8d57ba15471f8f321e89a0114bffb97fe4b618 (patch)
tree: a30b0824c2b24857c7f3feae31813d76f3b76965 /candle-core/src/quantized/k_quants.rs
parent: 33c23c19b6f4821c00a47758f7841baf52ba9081 (diff)
download: candle-4b8d57ba15471f8f321e89a0114bffb97fe4b618.tar.gz
candle-4b8d57ba15471f8f321e89a0114bffb97fe4b618.tar.bz2
candle-4b8d57ba15471f8f321e89a0114bffb97fe4b618.zip
AVX version of the q4k vecdot. (#651)
Diffstat (limited to 'candle-core/src/quantized/k_quants.rs')
-rw-r--r-- candle-core/src/quantized/k_quants.rs 3
1 files changed, 3 insertions, 0 deletions
diff --git a/candle-core/src/quantized/k_quants.rs b/candle-core/src/quantized/k_quants.rs
index 7b405ec9..7f14600b 100644
--- a/candle-core/src/quantized/k_quants.rs
+++ b/candle-core/src/quantized/k_quants.rs
@@ -1104,6 +1104,9 @@ impl GgmlType for BlockQ4K {
#[allow(unreachable_code)]
fn vec_dot(n: usize, xs: &[Self], ys: &[Self::VecDotType]) -> Result<f32> {
+ #[cfg(target_feature = "avx")]
+ return super::avx::vec_dot_q4k_q8k(n, xs, ys);
+
#[cfg(target_feature = "neon")]
return super::neon::vec_dot_q4k_q8k(n, xs, ys);