diff options
Diffstat (limited to 'candle-transformers/src/models/phi.rs')
-rw-r--r-- | candle-transformers/src/models/phi.rs | 17 |
1 files changed, 17 insertions, 0 deletions
diff --git a/candle-transformers/src/models/phi.rs b/candle-transformers/src/models/phi.rs index bffc14fa..36a08bb3 100644 --- a/candle-transformers/src/models/phi.rs +++ b/candle-transformers/src/models/phi.rs @@ -1,3 +1,20 @@ +//! Microsoft Phi model implementation +//! +//! See Phi model details at: +//! - [Phi-2 Model](https://huggingface.co/microsoft/phi-2) +//! +//! The Phi series are decoder-only transformers designed for code and language tasks. +//! Key characteristics: +//! - Decoder-only transformer architecture +//! - RoPE embeddings +//! - Layer normalization +//! - QK normalization +//! +//! References: +//! - [Hugging Face Implementation](https://huggingface.co/microsoft/phi-2) +//! - [Alternative Implementation](https://huggingface.co/microsoft/phi-2/tree/main) +//! + use crate::models::with_tracing::{layer_norm, linear, Embedding, LayerNorm, Linear}; /// Phi model. /// https://huggingface.co/microsoft/phi-2 |