diff options
author | Laurent Mazare <laurent.mazare@gmail.com> | 2023-08-29 09:41:17 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-08-29 09:41:17 +0100 |
commit | 4b8d57ba15471f8f321e89a0114bffb97fe4b618 (patch) | |
tree | a30b0824c2b24857c7f3feae31813d76f3b76965 /candle-core/src/quantized/k_quants.rs | |
parent | 33c23c19b6f4821c00a47758f7841baf52ba9081 (diff) | |
download | candle-4b8d57ba15471f8f321e89a0114bffb97fe4b618.tar.gz candle-4b8d57ba15471f8f321e89a0114bffb97fe4b618.tar.bz2 candle-4b8d57ba15471f8f321e89a0114bffb97fe4b618.zip |
AVX version of the q4k vecdot. (#651)
Diffstat (limited to 'candle-core/src/quantized/k_quants.rs')
-rw-r--r-- | candle-core/src/quantized/k_quants.rs | 3 |
1 file changed, 3 insertions, 0 deletions
diff --git a/candle-core/src/quantized/k_quants.rs b/candle-core/src/quantized/k_quants.rs
index 7b405ec9..7f14600b 100644
--- a/candle-core/src/quantized/k_quants.rs
+++ b/candle-core/src/quantized/k_quants.rs
@@ -1104,6 +1104,9 @@ impl GgmlType for BlockQ4K {
     #[allow(unreachable_code)]
     fn vec_dot(n: usize, xs: &[Self], ys: &[Self::VecDotType]) -> Result<f32> {
+        #[cfg(target_feature = "avx")]
+        return super::avx::vec_dot_q4k_q8k(n, xs, ys);
+
         #[cfg(target_feature = "neon")]
         return super::neon::vec_dot_q4k_q8k(n, xs, ys);