summary | refs | log | tree | commit | diff
path: root/candle-metal-kernels
diff options
context:
space:
mode:
author: Laurent Mazare <laurent.mazare@gmail.com> 2024-11-12 17:10:12 +0100
committer: GitHub <noreply@github.com> 2024-11-12 17:10:12 +0100
commit: 06350c31c780d6ea485f506032aea6ff8809e38a (patch)
tree: 811d3bd8443335b93f17d547d3abb5a9b3fc6ffd /candle-metal-kernels
parent: 9453cc30958dd0e9209aaeba30b15bb97aff0ea9 (diff)
download: candle-06350c31c780d6ea485f506032aea6ff8809e38a.tar.gz
candle-06350c31c780d6ea485f506032aea6ff8809e38a.tar.bz2
candle-06350c31c780d6ea485f506032aea6ff8809e38a.zip
Add some missing index-select metal kernels. (#2613)
* Add some missing index-select metal kernels.
* Make some matrix contiguous pre-matmul.
Diffstat (limited to 'candle-metal-kernels')
-rw-r--r-- candle-metal-kernels/src/indexing.metal | 4
1 files changed, 4 insertions, 0 deletions
diff --git a/candle-metal-kernels/src/indexing.metal b/candle-metal-kernels/src/indexing.metal
index 9eee97ca..c14f2c1f 100644
--- a/candle-metal-kernels/src/indexing.metal
+++ b/candle-metal-kernels/src/indexing.metal
@@ -193,12 +193,16 @@ INDEX_OP(is_i64_f16, int64_t, half)
INDEX_OP(is_i64_bf16, int64_t, bfloat)
#endif
+INDEX_OP(is_u32_u8, uint32_t, uint8_t)
+INDEX_OP(is_u32_u32, uint32_t, uint32_t)
INDEX_OP(is_u32_f32, uint32_t, float)
INDEX_OP(is_u32_f16, uint32_t, half)
#if defined(__HAVE_BFLOAT__)
INDEX_OP(is_u32_bf16, uint32_t, bfloat)
#endif
+INDEX_OP(is_u8_u8, uint8_t, uint8_t)
+INDEX_OP(is_u8_u32, uint8_t, uint32_t)
INDEX_OP(is_u8_f32, uint8_t, float)
INDEX_OP(is_u8_f16, uint8_t, half)
#if defined(__HAVE_BFLOAT__)