summary refs log tree commit diff
path: root/candle-transformers/src/models/phi.rs
diff options
context:
space:
mode:
Diffstat (limited to 'candle-transformers/src/models/phi.rs')
-rw-r--r-- candle-transformers/src/models/phi.rs 17
1 files changed, 17 insertions, 0 deletions
diff --git a/candle-transformers/src/models/phi.rs b/candle-transformers/src/models/phi.rs
index bffc14fa..36a08bb3 100644
--- a/candle-transformers/src/models/phi.rs
+++ b/candle-transformers/src/models/phi.rs
@@ -1,3 +1,20 @@
+//! Microsoft Phi model implementation
+//!
+//! See Phi model details at:
+//! - [Phi-2 Model](https://huggingface.co/microsoft/phi-2)
+//!
+//! The Phi models are decoder-only transformers designed for code and language tasks.
+//! Key characteristics:
+//! - Decoder-only transformer architecture
+//! - Rotary position embeddings (RoPE)
+//! - Layer normalization
+//! - Optional layer normalization of queries and keys (QK normalization)
+//!
+//! References:
+//! - [Hugging Face Model Card](https://huggingface.co/microsoft/phi-2)
+//! - [Hugging Face Model Repository Files](https://huggingface.co/microsoft/phi-2/tree/main)
+//!
+
use crate::models::with_tracing::{layer_norm, linear, Embedding, LayerNorm, Linear};
/// Phi model.
/// https://huggingface.co/microsoft/phi-2