summary | refs | log | tree | commit | diff
path: root/candle-core/src/quantized/cuda.rs
diff options
context:
space:
mode:
author Laurent Mazare <laurent.mazare@gmail.com> 2024-04-01 10:00:11 +0200
committer GitHub <noreply@github.com> 2024-04-01 10:00:11 +0200
commit c7557b65dcccbb45e53695db71e8d7c1bfd38dc2 (patch)
tree 2aa4b7e6cba34d47ac275d269b0b9a6d50b2ff8b /candle-core/src/quantized/cuda.rs
parent cd29c7ccd420a840d883361c290ee92d06b9b96c (diff)
download candle-c7557b65dcccbb45e53695db71e8d7c1bfd38dc2.tar.gz
candle-c7557b65dcccbb45e53695db71e8d7c1bfd38dc2.tar.bz2
candle-c7557b65dcccbb45e53695db71e8d7c1bfd38dc2.zip
Switch the default to using the faster kernels. (#1978)
* Switch the default to using the faster kernels.
* Add the force-dmmv flag.
Diffstat (limited to 'candle-core/src/quantized/cuda.rs')
-rw-r--r-- candle-core/src/quantized/cuda.rs 2
1 files changed, 1 insertions, 1 deletions
diff --git a/candle-core/src/quantized/cuda.rs b/candle-core/src/quantized/cuda.rs
index a8f0d622..64404beb 100644
--- a/candle-core/src/quantized/cuda.rs
+++ b/candle-core/src/quantized/cuda.rs
@@ -10,7 +10,7 @@ pub struct QCudaStorage {
device: CudaDevice,
}
-static FORCE_DMMV: std::sync::atomic::AtomicBool = std::sync::atomic::AtomicBool::new(true);
+static FORCE_DMMV: std::sync::atomic::AtomicBool = std::sync::atomic::AtomicBool::new(false);
pub fn set_force_dmmv(f: bool) {
FORCE_DMMV.store(f, std::sync::atomic::Ordering::Relaxed)