summary | refs | log | tree | commit | diff
path: root/candle-core/src/quantized/ggml_file.rs
diff options
context:
space:
mode:
Diffstat (limited to 'candle-core/src/quantized/ggml_file.rs')
-rw-r--r-- candle-core/src/quantized/ggml_file.rs 11
1 files changed, 2 insertions, 9 deletions
diff --git a/candle-core/src/quantized/ggml_file.rs b/candle-core/src/quantized/ggml_file.rs
index e6f5791c..99200bbd 100644
--- a/candle-core/src/quantized/ggml_file.rs
+++ b/candle-core/src/quantized/ggml_file.rs
@@ -1,7 +1,5 @@
//! Support for the GGML file format.
-#[cfg(feature = "metal")]
-use super::metal::load_quantized_metal;
use super::{k_quants, GgmlDType, QStorage};
use crate::{Device, Result};
use byteorder::{LittleEndian, ReadBytesExt};
@@ -130,13 +128,8 @@ fn from_raw_data<T: super::GgmlType + Send + Sync + 'static>(
let data = unsafe { std::slice::from_raw_parts(raw_data_ptr as *const T, n_blocks) };
let data: QStorage = match device {
Device::Cpu => QStorage::Cpu(Box::new(data.to_vec())),
- #[cfg(feature = "metal")]
- Device::Metal(metal) => load_quantized_metal(metal, data)?,
- #[cfg(not(feature = "metal"))]
- Device::Metal(_metal) => {
- crate::bail!("Metal backend requires `metal` feature")
- }
- device => unimplemented!("Implement quantized tensor for device {device:?}"),
+ Device::Metal(metal) => super::metal::load_quantized(metal, data)?,
+ Device::Cuda(cuda) => super::cuda::load_quantized(cuda, data)?,
};
super::QTensor::new(data, dims)
}