summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Nicolas Patry <patry.nicolas@protonmail.com> 2023-08-10 16:23:17 +0200
committer: GitHub <noreply@github.com> 2023-08-10 16:23:17 +0200
commit: 0b0fa56978b9fe722250d52c87cf39f9d8b2acdb (patch)
tree: eed0d5d77bff6a26d756d387b0a14f282eaa109b
parent: 385f0d261c9199b83373fc10b7b52a1fef67a9d0 (diff)
parent: 66d1c093e029e789ab66acc0b747643cb7b05ffa (diff)
download: candle-0b0fa56978b9fe722250d52c87cf39f9d8b2acdb.tar.gz
candle-0b0fa56978b9fe722250d52c87cf39f9d8b2acdb.tar.bz2
candle-0b0fa56978b9fe722250d52c87cf39f9d8b2acdb.zip
Merge pull request #386 from huggingface/enabling_61_maybe
This is duplicated code on CUDA 12.2.
-rw-r--r-- candle-kernels/src/compatibility.cuh | 18
1 file changed, 0 insertions, 18 deletions
diff --git a/candle-kernels/src/compatibility.cuh b/candle-kernels/src/compatibility.cuh
index 2df8e921..5a22f4bc 100644
--- a/candle-kernels/src/compatibility.cuh
+++ b/candle-kernels/src/compatibility.cuh
@@ -6,24 +6,6 @@
// FIXME: the minimum compute capabilities are just guesses since the table is not specific enough
-// #if __CUDA_ARCH__ < 600
-// __device__ __forceinline__ __half __hmax(__half a, __half b) {
-// return __float2half(fmaxf(__half2float(a), __half2float(b)));
-// }
-// __device__ __forceinline__ __half __hmin(__half a, __half b) {
-// return __float2half(fminf(__half2float(a), __half2float(b)));
-// }
-// #endif
-
-#if __CUDA_ARCH__ < 800
-__device__ __forceinline__ __half __hmax_nan(__half a, __half b) {
- // return __hisnan(a) ? a : (__hisnan(b) ? b : __hmax(a, b));
-}
-__device__ __forceinline__ __half __hmin_nan(__half a, __half b) {
- // return __hisnan(a) ? a : (__hisnan(b) ? b : __hmin(a, b));
-}
-#endif
-
#if __CUDA_ARCH__ < 600
// Copied from https://docs.nvidia.com/cuda/cuda-c-programming-guide/#atomic-functions
__device__ double atomicAdd(double* address, double val) {