summary | refs | log | tree | commit | diff
path: root/candle-core/examples/llama/main.rs
diff options
context:
space:
mode:
Diffstat (limited to 'candle-core/examples/llama/main.rs')
-rw-r--r-- candle-core/examples/llama/main.rs 2
1 files changed, 2 insertions, 0 deletions
diff --git a/candle-core/examples/llama/main.rs b/candle-core/examples/llama/main.rs
index eb681f4b..3fc893e3 100644
--- a/candle-core/examples/llama/main.rs
+++ b/candle-core/examples/llama/main.rs
@@ -487,6 +487,7 @@ fn main() -> Result<()> {
let mut rng = thread_rng();
let start_gen = std::time::Instant::now();
for index in 0..args.sample_len {
+ let start_gen = std::time::Instant::now();
let ctxt = &tokens[tokens.len().saturating_sub(CONTEXT_SIZE)..];
let input = Tensor::new(ctxt, &device)?;
let logits = llama.forward(&input, &freqs_cis)?;
@@ -496,6 +497,7 @@ fn main() -> Result<()> {
let next_token = distr.sample(&mut rng) as u32;
tokens.push(next_token);
new_tokens.push(next_token);
+ println!("> {:?}", start_gen.elapsed());
println!(
"{} token: {} '{}'",
index + 1,