diff options
author | Laurent Mazare <laurent.mazare@gmail.com> | 2023-10-27 15:34:06 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-10-27 15:34:06 +0100 |
commit | e2826e70b3725c53656f1ff76753472b29e1c5f7 (patch) | |
tree | 3e4482888e35b753666936e8ed189a5bffaa2e63 /candle-core/src/quantized/simd128.rs | |
parent | 916619f70bfae089597ce421e19a3b2e85c2d27b (diff) | |
download | candle-e2826e70b3725c53656f1ff76753472b29e1c5f7.tar.gz candle-e2826e70b3725c53656f1ff76753472b29e1c5f7.tar.bz2 candle-e2826e70b3725c53656f1ff76753472b29e1c5f7.zip |
Add a quantized variant of llama2.c (#1197)
* Add a quantized variant of llama2.c
* Clippy fixes.
Diffstat (limited to 'candle-core/src/quantized/simd128.rs')
-rw-r--r-- | candle-core/src/quantized/simd128.rs | 4 |
1 files changed, 0 insertions, 4 deletions
diff --git a/candle-core/src/quantized/simd128.rs b/candle-core/src/quantized/simd128.rs
index 687399c2..f256fdc2 100644
--- a/candle-core/src/quantized/simd128.rs
+++ b/candle-core/src/quantized/simd128.rs
@@ -61,10 +61,6 @@ pub(crate) fn vec_dot_q8_0_q8_0(n: usize, xs: &[BlockQ8_0], ys: &[BlockQ8_0]) ->
     if n % QK8_0 != 0 {
         crate::bail!("vec_dot_q8_0_q8_0: {n} is not divisible by {qk}")
     }
-    let nb = n / QK8_0;
-    if nb % 2 != 0 {
-        crate::bail!("vec_dot_q8_0_q8_0: {nb} is not even")
-    }
     unsafe {
         let mut acc = f32x4_splat(0.0f32);
         for (x, y) in xs.iter().zip(ys.iter()) {