diff options
author | Laurent Mazare <laurent.mazare@gmail.com> | 2024-03-12 11:30:24 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-03-12 11:30:24 +0100 |
commit | ff03fd3fb314980d3273ffc49826d764541d76e2 (patch) | |
tree | daf07e953c992146e67f593e94819ef66822dfe8 /candle-transformers/src/quantized_nn.rs | |
parent | df5f69444e438a7cd8d8ab4971579bf309b72114 (diff) | |
download | candle-ff03fd3fb314980d3273ffc49826d764541d76e2.tar.gz candle-ff03fd3fb314980d3273ffc49826d764541d76e2.tar.bz2 candle-ff03fd3fb314980d3273ffc49826d764541d76e2.zip |
Expose some helper functions to create quantized models. (#1837)
Diffstat (limited to 'candle-transformers/src/quantized_nn.rs')
-rw-r--r-- | candle-transformers/src/quantized_nn.rs | 8 |
1 files changed, 8 insertions, 0 deletions
diff --git a/candle-transformers/src/quantized_nn.rs b/candle-transformers/src/quantized_nn.rs index 21c88430..bb0a8641 100644 --- a/candle-transformers/src/quantized_nn.rs +++ b/candle-transformers/src/quantized_nn.rs @@ -35,6 +35,14 @@ pub struct Linear { } impl Linear { + pub fn from_arc( + weight: std::sync::Arc<candle::quantized::QTensor>, + bias: Option<Tensor>, + ) -> Result<Self> { + let weight = QMatMul::from_weights(weight)?; + Ok(Self { weight, bias }) + } + pub fn from_weights(weight: QMatMul, bias: Option<Tensor>) -> Self { Self { weight, bias } } |