diff options
author | Laurent Mazare <laurent.mazare@gmail.com> | 2023-08-23 11:09:55 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-08-23 11:09:55 +0100 |
commit | 0f4ff8a739facafd4b3bc9a003d4a581202b62f8 (patch) | |
tree | 2cc91ab3994996941d8826121880ddd4814562bd /candle-examples/examples/quantized/main.rs | |
parent | 89a00b56cce79e1735928701c0e45f5c70122adb (diff) | |
download | candle-0f4ff8a739facafd4b3bc9a003d4a581202b62f8.tar.gz candle-0f4ff8a739facafd4b3bc9a003d4a581202b62f8.tar.bz2 candle-0f4ff8a739facafd4b3bc9a003d4a581202b62f8.zip |
Fix the quantized example. (#564)
Diffstat (limited to 'candle-examples/examples/quantized/main.rs')
-rw-r--r-- | candle-examples/examples/quantized/main.rs | 4 |
1 file changed, 2 insertions, 2 deletions
```diff
diff --git a/candle-examples/examples/quantized/main.rs b/candle-examples/examples/quantized/main.rs
index c4be8974..dfe81632 100644
--- a/candle-examples/examples/quantized/main.rs
+++ b/candle-examples/examples/quantized/main.rs
@@ -605,8 +605,8 @@ fn main() -> anyhow::Result<()> {
             );
             println!("params: {:?}", model.hparams);
             let default_gqa = match args.which {
-                Which::L7b | Which::L13b => 1,
-                Which::L70b => 8,
+                Which::L7b | Which::L13b | Which::L7bChat | Which::L13bChat => 1,
+                Which::L70b | Which::L70bChat => 8,
             };
             ModelWeights::from_ggml(model, args.gqa.unwrap_or(default_gqa))?
         }
```