summaryrefslogtreecommitdiff
path: root/candle-transformers/src/models/bigcode.rs
diff options
context:
space:
mode:
Diffstat (limited to 'candle-transformers/src/models/bigcode.rs')
-rw-r--r--candle-transformers/src/models/bigcode.rs18
1 files changed, 17 insertions, 1 deletions
diff --git a/candle-transformers/src/models/bigcode.rs b/candle-transformers/src/models/bigcode.rs
index 8ed1462b..c5dcb6bc 100644
--- a/candle-transformers/src/models/bigcode.rs
+++ b/candle-transformers/src/models/bigcode.rs
@@ -1,9 +1,25 @@
//! BigCode implementation in Rust based on the GPT-BigCode model.
//!
-//! See "StarCoder: A State-of-the-Art LLM for Code", Mukherjee et al. 2023
+//! [StarCoder/BigCode](https://huggingface.co/bigcode/starcoderbase-1b) is an LLM
+//! specialized for code generation. The initial model was trained on 80
+//! programming languages. See "StarCoder: may the source be with you!", Li et al. 2023
//! - [Arxiv](https://arxiv.org/abs/2305.06161)
//! - [Github](https://github.com/bigcode-project/starcoder)
//!
+//! ## Running an example
+//!
+//! ```bash
+//! cargo run --example bigcode --release -- --prompt "fn fact(n: u64) -> u64"
+//!
+//! > fn fact(n: u64) -> u64 {
+//! > if n == 0 {
+//! > 1
+//! > } else {
+//! > n * fact(n - 1)
+//! > }
+//! > }
+//! ```
+//!
use candle::{DType, Device, IndexOp, Result, Tensor, D};
use candle_nn::{embedding, linear_b as linear, Embedding, LayerNorm, Linear, Module, VarBuilder};