| .. |
|
alibi.h
|
Clean up alibi, implement non-causal alibi
|
2023-12-21 22:27:40 -08:00 |
|
block_info.h
|
Allow varlen_fwd to take optional seqused_k (#647)
|
2023-11-27 00:41:23 -08:00 |
|
dropout.h
|
Move dropout to a separate file (dropout.h)
|
2024-01-14 12:19:17 -08:00 |
|
flash_bwd_hdim32_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim32_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim64_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim64_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim96_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim96_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim128_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim128_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim160_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim160_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim192_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim192_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim224_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim224_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim256_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_hdim256_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_bwd_kernel.h
|
Move dropout to a separate file (dropout.h)
|
2024-01-14 12:19:17 -08:00 |
|
flash_bwd_launch_template.h
|
Implement deterministic backward (thanks to Meituan)
|
2023-12-23 17:57:36 -08:00 |
|
flash_fwd_hdim32_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim32_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim64_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim64_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim96_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim96_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim128_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim128_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim160_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim160_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim192_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim192_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim224_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim224_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim256_bf16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_hdim256_fp16_sm80.cu
|
Use generate_kernels.py script from Driss Guessous
|
2023-08-28 13:34:12 -07:00 |
|
flash_fwd_kernel.h
|
Move dropout to a separate file (dropout.h)
|
2024-01-14 12:19:17 -08:00 |
|
flash_fwd_launch_template.h
|
Implement deterministic backward (thanks to Meituan)
|
2023-12-23 17:57:36 -08:00 |
|
flash_fwd_split_hdim32_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim32_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim64_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim64_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim96_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim96_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim128_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim128_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim160_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim160_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim192_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim192_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim224_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim224_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim256_bf16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash_fwd_split_hdim256_fp16_sm80.cu
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
flash.h
|
Implement deterministic backward (thanks to Meituan)
|
2023-12-23 17:57:36 -08:00 |
|
generate_kernels.py
|
Implement splitKV attention
|
2023-08-29 00:58:29 -07:00 |
|
kernel_traits_sm90.h
|
FlashAttention-2 release
|
2023-07-17 06:21:34 -07:00 |
|
kernel_traits.h
|
Simplify writing softmax to gmem
|
2024-01-13 00:25:04 -08:00 |
|
philox.cuh
|
Remove dead code in philox.cuh
|
2024-01-13 02:02:03 -08:00 |
|
softmax.h
|
Move dropout to a separate file (dropout.h)
|
2024-01-14 12:19:17 -08:00 |
|
static_switch.h
|
Fix compile error on MSVC
|
2023-07-19 08:04:57 +00:00 |
|
utils.h
|
apply_dropout now takes tensor of rowcol layout
|
2024-01-14 01:03:23 -08:00 |