summaryrefslogtreecommitdiff
path: root/candle-flash-attn/kernels/alibi.h
diff options
context:
space:
mode:
authorZhuo Jinggang <jg.zhuo@outlook.com>2024-07-12 16:00:03 +0800
committerGitHub <noreply@github.com>2024-07-12 10:00:03 +0200
commitc63048d3748649c6f13148eb01e6d812d897a0d2 (patch)
tree275f50476521bf47bb89530dd822a45ae776e6d3 /candle-flash-attn/kernels/alibi.h
parenta226a9736baee550b01de53cb3e416d3d94e69d3 (diff)
downloadcandle-c63048d3748649c6f13148eb01e6d812d897a0d2.tar.gz
candle-c63048d3748649c6f13148eb01e6d812d897a0d2.tar.bz2
candle-c63048d3748649c6f13148eb01e6d812d897a0d2.zip
add quantized qwen2 (#2329)
* add quantized version of qwen2 and corresponding example for qwen2-instruct * fix quantized qwen2 clippy error
Diffstat (limited to 'candle-flash-attn/kernels/alibi.h')
0 files changed, 0 insertions, 0 deletions