summary | refs | log | tree | commit | diff
path: root/candle-nn/examples
diff options
context:
space:
mode:
author: Laurent Mazare <laurent.mazare@gmail.com>, 2023-10-02 17:17:46 +0100
committer: GitHub <noreply@github.com>, 2023-10-02 17:17:46 +0100
commit: 089fc3b5847668469cad740f29412d19d9e9fecf (patch)
tree: 57affdeeee6607066dfbc416db8ca5617ac7f0af /candle-nn/examples
parent: e04c789230c609c285991b78c29f1d6eef0d104f (diff)
download: candle-089fc3b5847668469cad740f29412d19d9e9fecf.tar.gz
candle-089fc3b5847668469cad740f29412d19d9e9fecf.tar.bz2
candle-089fc3b5847668469cad740f29412d19d9e9fecf.zip
Improve the quantized whisper setup. (#1018)
* Improve the quantized whisper setup.
* Fix the config file paths.
* Use the standard matmul where possible.
Diffstat (limited to 'candle-nn/examples')
-rw-r--r-- candle-nn/examples/cpu_benchmarks.rs | 2
1 file changed, 1 insertion, 1 deletion
diff --git a/candle-nn/examples/cpu_benchmarks.rs b/candle-nn/examples/cpu_benchmarks.rs
index 204a7109..e58ea727 100644
--- a/candle-nn/examples/cpu_benchmarks.rs
+++ b/candle-nn/examples/cpu_benchmarks.rs
@@ -206,7 +206,7 @@ impl Benchmark for QMatMul {
fn preprocess() -> Result<Self::PreProcessData> {
let zeros = vec![candle::quantized::k_quants::BlockQ4_0::zeros(); 4096 * 11008 / 32];
let mm = candle::quantized::QTensor::new(zeros, (4096, 11008))?;
- let mm = candle::quantized::QMatMul::from_qtensor(mm);
+ let mm = candle::quantized::QMatMul::from_qtensor(mm)?;
let arg = Tensor::randn(0f32, 1., (128, 11008), &Device::Cpu)?;
Ok((mm, arg))
}