WIP because there seem to be some race conditions for head dimensions other than 16, 32, 64, 128. |
||
|---|---|---|
| .. | ||
| utils | ||
| __init__.py | ||
| bert_padding.py | ||
| flash_attention.py | ||
| flash_attn_interface.py | ||
| flash_attn_triton_og.py | ||
| flash_attn_triton.py | ||
| flash_blocksparse_attention.py | ||
| flash_blocksparse_attn_interface.py | ||
| fused_softmax.py | ||
| rotary.py | ||