summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Luka Zakrajšek <luka@bancek.net> 2025-01-04 16:11:20 +0100
committer: GitHub <noreply@github.com> 2025-01-04 16:11:20 +0100
commit: 57f41da13b10d909b85b7c335050e14fdb5b0d9b (patch)
tree: 4b3d43b367d9bc1ba994c86f9bfe41d279bfa550
parent: cbaa0ad46f0eda2f3d9bcf8a42d6271e6760e578 (diff)
download: candle-57f41da13b10d909b85b7c335050e14fdb5b0d9b.tar.gz
candle-57f41da13b10d909b85b7c335050e14fdb5b0d9b.tar.bz2
candle-57f41da13b10d909b85b7c335050e14fdb5b0d9b.zip
Fix mistral attention on Metal (#2699)
Co-authored-by: Luka Zakrajsek <luka.zakrajsek@soniox.com>
-rw-r--r-- candle-transformers/src/models/mistral.rs 3
1 file changed, 2 insertions, 1 deletion
diff --git a/candle-transformers/src/models/mistral.rs b/candle-transformers/src/models/mistral.rs
index f927f88b..8df73d61 100644
--- a/candle-transformers/src/models/mistral.rs
+++ b/candle-transformers/src/models/mistral.rs
@@ -262,7 +262,8 @@ impl Attention {
.contiguous()?;
let value_states = value_states
.reshape((b_sz, q_len, self.num_kv_heads, self.head_dim))?
- .transpose(1, 2)?;
+ .transpose(1, 2)?
+ .contiguous()?;
let (query_states, key_states) =
self.rotary_emb