summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author cksac <cs.cksac@gmail.com> 2023-08-23 18:05:33 +0800
committer GitHub <noreply@github.com> 2023-08-23 11:05:33 +0100
commit 89a00b56cce79e1735928701c0e45f5c70122adb (patch)
tree 7d3a5f67e623140c30a5a4b6c93c21387fa3c4e3
parent 9a5c7db91a40bfeab1dbaf1622c67a21f5ad19b8 (diff)
download candle-89a00b56cce79e1735928701c0e45f5c70122adb.tar.gz
candle-89a00b56cce79e1735928701c0e45f5c70122adb.tar.bz2
candle-89a00b56cce79e1735928701c0e45f5c70122adb.zip
add chat models in quantized example (#551)
* add chat models in quantized example
* cargo fmt
-rw-r--r-- candle-examples/examples/quantized/main.rs 18
1 files changed, 18 insertions, 0 deletions
diff --git a/candle-examples/examples/quantized/main.rs b/candle-examples/examples/quantized/main.rs
index 7c457f7a..c4be8974 100644
--- a/candle-examples/examples/quantized/main.rs
+++ b/candle-examples/examples/quantized/main.rs
@@ -391,6 +391,12 @@ enum Which {
L13b,
#[value(name = "70b")]
L70b,
+ #[value(name = "7b-chat")]
+ L7bChat,
+ #[value(name = "13b-chat")]
+ L13bChat,
+ #[value(name = "70b-chat")]
+ L70bChat,
}
#[derive(Parser, Debug)]
@@ -466,6 +472,18 @@ impl Args {
Which::L7b => ("TheBloke/Llama-2-7B-GGML", "llama-2-7b.ggmlv3.q4_0.bin"),
Which::L13b => ("TheBloke/Llama-2-13B-GGML", "llama-2-13b.ggmlv3.q4_0.bin"),
Which::L70b => ("TheBloke/Llama-2-70B-GGML", "llama-2-70b.ggmlv3.q4_0.bin"),
+ Which::L7bChat => (
+ "TheBloke/Llama-2-7B-Chat-GGML",
+ "llama-2-7b-chat.ggmlv3.q4_0.bin",
+ ),
+ Which::L13bChat => (
+ "TheBloke/Llama-2-13B-Chat-GGML",
+ "llama-2-13b-chat.ggmlv3.q4_0.bin",
+ ),
+ Which::L70bChat => (
+ "TheBloke/Llama-2-70B-Chat-GGML",
+ "llama-2-70b-chat.ggmlv3.q4_0.bin",
+ ),
};
let api = hf_hub::api::sync::Api::new()?;
let api = api.model(repo.to_string());