summary | refs | log | tree | commit | diff
path: root/candle-transformers/src/models/llama2_c_weights.rs
diff options
context:
space:
mode:
Diffstat (limited to 'candle-transformers/src/models/llama2_c_weights.rs')
-rw-r--r-- candle-transformers/src/models/llama2_c_weights.rs 6
1 files changed, 6 insertions, 0 deletions
diff --git a/candle-transformers/src/models/llama2_c_weights.rs b/candle-transformers/src/models/llama2_c_weights.rs
index e5a8bb88..8149c214 100644
--- a/candle-transformers/src/models/llama2_c_weights.rs
+++ b/candle-transformers/src/models/llama2_c_weights.rs
@@ -1,3 +1,9 @@
+//! Llama2 inference implementation.
+//!
+//! See ["LLaMA 2: Open Foundation and Fine-Tuned Chat Models"](https://arxiv.org/abs/2307.09288)
+//!
+//! Based on the [llama2.c](https://github.com/karpathy/llama2.c) implementation
+
use byteorder::{LittleEndian, ReadBytesExt};
use candle::{DType, Device, IndexOp, Result, Shape, Tensor};
use candle_nn::VarBuilder;