summary | refs | log | tree | commit | diff
path: root/candle-core/src/quantized/simd128.rs
diff options
context:
space:
mode:
author: Laurent Mazare <laurent.mazare@gmail.com> 2023-10-27 15:34:06 +0100
committer: GitHub <noreply@github.com> 2023-10-27 15:34:06 +0100
commit: e2826e70b3725c53656f1ff76753472b29e1c5f7 (patch)
tree: 3e4482888e35b753666936e8ed189a5bffaa2e63 /candle-core/src/quantized/simd128.rs
parent: 916619f70bfae089597ce421e19a3b2e85c2d27b (diff)
download: candle-e2826e70b3725c53656f1ff76753472b29e1c5f7.tar.gz
candle-e2826e70b3725c53656f1ff76753472b29e1c5f7.tar.bz2
candle-e2826e70b3725c53656f1ff76753472b29e1c5f7.zip
Add a quantized variant of llama2.c (#1197)
* Add a quantized variant of llama2.c
* Clippy fixes.
Diffstat (limited to 'candle-core/src/quantized/simd128.rs')
-rw-r--r-- candle-core/src/quantized/simd128.rs 4
1 files changed, 0 insertions, 4 deletions
diff --git a/candle-core/src/quantized/simd128.rs b/candle-core/src/quantized/simd128.rs
index 687399c2..f256fdc2 100644
--- a/candle-core/src/quantized/simd128.rs
+++ b/candle-core/src/quantized/simd128.rs
@@ -61,10 +61,6 @@ pub(crate) fn vec_dot_q8_0_q8_0(n: usize, xs: &[BlockQ8_0], ys: &[BlockQ8_0]) ->
if n % QK8_0 != 0 {
crate::bail!("vec_dot_q8_0_q8_0: {n} is not divisible by {qk}")
}
- let nb = n / QK8_0;
- if nb % 2 != 0 {
- crate::bail!("vec_dot_q8_0_q8_0: {nb} is not even")
- }
unsafe {
let mut acc = f32x4_splat(0.0f32);
for (x, y) in xs.iter().zip(ys.iter()) {