author     Laurent Mazare <laurent.mazare@gmail.com>  2023-07-12 20:24:23 +0100
committer  GitHub <noreply@github.com>                2023-07-12 20:24:23 +0100
commit     465fc8c0c5bae73d1ab4c119daa26bb04312a39f (patch)
tree       ca5f0056144db48714312379ea9437960550beee /candle-nn/src
parent     f09d7e565326b609c3a64505de910bbaedce8a1c (diff)
Add some documentation and test to the linear layer. (#151)
* Add some documentation and test to the linear layer.
* Layer norm doc.
* Minor tweaks.
Diffstat (limited to 'candle-nn/src')
-rw-r--r--   candle-nn/src/conv.rs        |  1
-rw-r--r--   candle-nn/src/embedding.rs   |  1
-rw-r--r--   candle-nn/src/layer_norm.rs  | 30
-rw-r--r--   candle-nn/src/linear.rs      | 19
4 files changed, 51 insertions(+), 0 deletions(-)
diff --git a/candle-nn/src/conv.rs b/candle-nn/src/conv.rs
index e670a0d2..d938cae4 100644
--- a/candle-nn/src/conv.rs
+++ b/candle-nn/src/conv.rs
@@ -1,3 +1,4 @@
+//! Convolution Layers.
 use candle::{Result, Tensor};
 
 #[derive(Debug, Clone, Copy, PartialEq, Eq)]
diff --git a/candle-nn/src/embedding.rs b/candle-nn/src/embedding.rs
index deeba01e..a0a853b0 100644
--- a/candle-nn/src/embedding.rs
+++ b/candle-nn/src/embedding.rs
@@ -1,3 +1,4 @@
+//! Embedding Layer.
 use candle::{Result, Tensor};
 
 #[derive(Debug)]
diff --git a/candle-nn/src/layer_norm.rs b/candle-nn/src/layer_norm.rs
index 0b208c49..188a02bf 100644
--- a/candle-nn/src/layer_norm.rs
+++ b/candle-nn/src/layer_norm.rs
@@ -1,3 +1,33 @@
+//! Layer Normalization.
+//!
+//! This layer applies Layer Normalization over a mini-batch of inputs as described in [`Layer
+//! Normalization`]. The input is expected to have three dimensions: a batch dimension, a length,
+//! and a hidden size; the normalization is applied over the last dimension.
+//!
+//! # Example
+//!
+//! ```rust
+//! use candle::{Tensor, Device::Cpu};
+//! use candle_nn::LayerNorm;
+//! # fn main() -> candle::Result<()> {
+//!
+//! let w = Tensor::new(1f32, &Cpu)?;
+//! let b = Tensor::new(0f32, &Cpu)?;
+//! let layer = LayerNorm::new(w, b, 1e-5);
+//!
+//! let xs = Tensor::new(
+//! &[[[1f32, 2., 3.], [4., 5., 6.], [9., 8., 7.]]],
+//! &Cpu)?;
+//! let ys = layer.forward(&xs)?;
+//! assert_eq!(
+//! ys.to_vec3::<f32>()?,
+//! &[[[-1.2247356, 0.0, 1.2247356],
+//! [-1.2247356, 0.0, 1.2247356],
+//! [ 1.2247356, 0.0, -1.2247356]]]);
+//! # Ok(()) }
+//! ```
+//!
+//! [`Layer Normalization`]: https://arxiv.org/abs/1607.06450
 use candle::{DType, Result, Tensor};
 
 // This layer norm version handles both weight and bias so removes the mean.
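The expected values in the layer_norm doc-test above can be checked by hand. Below is a minimal sketch in plain Rust (no candle dependency), assuming the layer computes `(x - mean) / sqrt(var + eps) * w + b` with the biased variance estimator; `layer_norm_row` is a hypothetical helper used only for illustration.

```rust
// Minimal sketch, not part of the diff: reproduce the doc-test values assuming
// the formula (x - mean) / sqrt(var + eps) * w + b with the biased variance
// estimator (divide by the row length). `layer_norm_row` is a hypothetical helper.
fn layer_norm_row(xs: &[f32], eps: f32, w: f32, b: f32) -> Vec<f32> {
    let n = xs.len() as f32;
    let mean = xs.iter().sum::<f32>() / n;
    let var = xs.iter().map(|x| (x - mean) * (x - mean)).sum::<f32>() / n;
    xs.iter().map(|x| (x - mean) / (var + eps).sqrt() * w + b).collect()
}

fn main() {
    // For [1, 2, 3]: mean = 2, var = 2/3, so (1 - 2) / sqrt(2/3 + 1e-5) ≈ -1.2247356,
    // matching the first row asserted in the doc-test.
    println!("{:?}", layer_norm_row(&[1., 2., 3.], 1e-5, 1., 0.));
}
```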
diff --git a/candle-nn/src/linear.rs b/candle-nn/src/linear.rs
index 2e65ca2d..943011c9 100644
--- a/candle-nn/src/linear.rs
+++ b/candle-nn/src/linear.rs
@@ -1,3 +1,22 @@
+//! Linear layer
+//!
+//! This layer applies a linear transformation to the incoming data, `y = x@w.t() + b`.
+//! The bias is optional. The `forward` method can be used to apply the layer; it supports input
+//! with a batch dimension (so of shape `(b_sz, in_c)`) or without (of shape `(in_c,)`). The
+//! output has shape `(b_sz, out_c)` or `(out_c,)` respectively.
+//!
+//! ```rust
+//! use candle::{Tensor, Device::Cpu};
+//! use candle_nn::Linear;
+//! # fn main() -> candle::Result<()> {
+//!
+//! let w = Tensor::new(&[[1f32, 2.], [3., 4.], [5., 6.]], &Cpu)?;
+//! let layer = Linear::new(w, None); // Use no bias.
+//! let xs = Tensor::new(&[[10f32, 100.]], &Cpu)?;
+//! let ys = layer.forward(&xs)?;
+//! assert_eq!(ys.to_vec2::<f32>()?, &[[210.0, 430.0, 650.0]]);
+//! # Ok(()) }
+//! ```
 use candle::Tensor;
 
 #[derive(Debug)]
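The value asserted in the linear doc-test is simply `y = x @ w.t()` with no bias. Here is a minimal sketch in plain Rust that spells out the dot products; `linear_no_bias` is a hypothetical helper used only for illustration.

```rust
// Minimal sketch, not part of the diff: each output element is the dot product
// of the input with one row of `w`, i.e. y = x @ w.t() without a bias term.
// `linear_no_bias` is a hypothetical helper.
fn linear_no_bias(x: &[f32], w: &[[f32; 2]]) -> Vec<f32> {
    w.iter()
        .map(|row| row.iter().zip(x).map(|(wi, xi)| wi * xi).sum())
        .collect()
}

fn main() {
    let w = [[1f32, 2.], [3., 4.], [5., 6.]];
    let x = [10f32, 100.];
    // 10*1 + 100*2 = 210, 10*3 + 100*4 = 430, 10*5 + 100*6 = 650,
    // matching the doc-test assertion above.
    println!("{:?}", linear_no_bias(&x, &w));
}
```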