summary | refs | log | tree | commit | diff
path: root/candle-transformers/src/quantized_var_builder.rs
diff options
context:
space:
mode:
Diffstat (limited to 'candle-transformers/src/quantized_var_builder.rs')
-rw-r--r-- candle-transformers/src/quantized_var_builder.rs | 6
1 files changed, 6 insertions, 0 deletions
diff --git a/candle-transformers/src/quantized_var_builder.rs b/candle-transformers/src/quantized_var_builder.rs
index 875a2b45..2ac64aa5 100644
--- a/candle-transformers/src/quantized_var_builder.rs
+++ b/candle-transformers/src/quantized_var_builder.rs
@@ -1,3 +1,9 @@
+//! VarBuilder for loading GGUF files
+//!
+//! VarBuilder is a utility to store quantized tensors from a [GGUF model file](https://huggingface.co/docs/hub/gguf).
+//! These tensors can be loaded from disk using `from_gguf` or from an in-memory
+//! buffer using `from_gguf_buffer`.
+
use candle::quantized::QTensor;
use candle::{Device, Result, Shape};
use std::sync::Arc;