diff options
author | Laurent Mazare <laurent.mazare@gmail.com> | 2023-10-02 17:17:46 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-10-02 17:17:46 +0100 |
commit | 089fc3b5847668469cad740f29412d19d9e9fecf (patch) | |
tree | 57affdeeee6607066dfbc416db8ca5617ac7f0af /candle-nn/examples | |
parent | e04c789230c609c285991b78c29f1d6eef0d104f (diff) | |
download | candle-089fc3b5847668469cad740f29412d19d9e9fecf.tar.gz candle-089fc3b5847668469cad740f29412d19d9e9fecf.tar.bz2 candle-089fc3b5847668469cad740f29412d19d9e9fecf.zip |
Improve the quantized whisper setup. (#1018)
* Improve the quantized whisper setup.
* Fix the config file paths.
* Use the standard matmul where possible.
Diffstat (limited to 'candle-nn/examples')
-rw-r--r-- | candle-nn/examples/cpu_benchmarks.rs | 2 |
1 files changed, 1 insertions, 1 deletions
diff --git a/candle-nn/examples/cpu_benchmarks.rs b/candle-nn/examples/cpu_benchmarks.rs
index 204a7109..e58ea727 100644
--- a/candle-nn/examples/cpu_benchmarks.rs
+++ b/candle-nn/examples/cpu_benchmarks.rs
@@ -206,7 +206,7 @@ impl Benchmark for QMatMul {
     fn preprocess() -> Result<Self::PreProcessData> {
         let zeros = vec![candle::quantized::k_quants::BlockQ4_0::zeros(); 4096 * 11008 / 32];
         let mm = candle::quantized::QTensor::new(zeros, (4096, 11008))?;
-        let mm = candle::quantized::QMatMul::from_qtensor(mm);
+        let mm = candle::quantized::QMatMul::from_qtensor(mm)?;
         let arg = Tensor::randn(0f32, 1., (128, 11008), &Device::Cpu)?;
         Ok((mm, arg))
     }