diff options
Diffstat (limited to 'candle-flash-attn/kernels/flash_fwd_hdim96_bf16_sm80.cu')
-rw-r--r-- | candle-flash-attn/kernels/flash_fwd_hdim96_bf16_sm80.cu | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/candle-flash-attn/kernels/flash_fwd_hdim96_bf16_sm80.cu b/candle-flash-attn/kernels/flash_fwd_hdim96_bf16_sm80.cu index 9c003540..e696b2f2 100644 --- a/candle-flash-attn/kernels/flash_fwd_hdim96_bf16_sm80.cu +++ b/candle-flash-attn/kernels/flash_fwd_hdim96_bf16_sm80.cu @@ -5,6 +5,6 @@ #include "flash_fwd_launch_template.h" template<> -void run_mha_fwd_<cutlass::bfloat16_t, 96>(Flash_fwd_params &params, cudaStream_t stream) { - run_mha_fwd_hdim96<cutlass::bfloat16_t>(params, stream); +void run_mha_fwd_<cutlass::bfloat16_t, 96, false>(Flash_fwd_params &params, cudaStream_t stream) { + run_mha_fwd_hdim96<cutlass::bfloat16_t, false>(params, stream); } |