summaryrefslogtreecommitdiff
path: root/candle-transformers/src/quantized_nn.rs
diff options
context:
space:
mode:
authorLaurent Mazare <laurent.mazare@gmail.com>2024-03-12 11:30:24 +0100
committerGitHub <noreply@github.com>2024-03-12 11:30:24 +0100
commitff03fd3fb314980d3273ffc49826d764541d76e2 (patch)
treedaf07e953c992146e67f593e94819ef66822dfe8 /candle-transformers/src/quantized_nn.rs
parentdf5f69444e438a7cd8d8ab4971579bf309b72114 (diff)
downloadcandle-ff03fd3fb314980d3273ffc49826d764541d76e2.tar.gz
candle-ff03fd3fb314980d3273ffc49826d764541d76e2.tar.bz2
candle-ff03fd3fb314980d3273ffc49826d764541d76e2.zip
Expose some helper functions to create quantized models. (#1837)
Diffstat (limited to 'candle-transformers/src/quantized_nn.rs')
-rw-r--r--candle-transformers/src/quantized_nn.rs8
1 files changed, 8 insertions, 0 deletions
diff --git a/candle-transformers/src/quantized_nn.rs b/candle-transformers/src/quantized_nn.rs
index 21c88430..bb0a8641 100644
--- a/candle-transformers/src/quantized_nn.rs
+++ b/candle-transformers/src/quantized_nn.rs
@@ -35,6 +35,14 @@ pub struct Linear {
}
impl Linear {
+ pub fn from_arc(
+ weight: std::sync::Arc<candle::quantized::QTensor>,
+ bias: Option<Tensor>,
+ ) -> Result<Self> {
+ let weight = QMatMul::from_weights(weight)?;
+ Ok(Self { weight, bias })
+ }
+
pub fn from_weights(weight: QMatMul, bias: Option<Tensor>) -> Self {
Self { weight, bias }
}