Import torch before flash_attn_2_cuda

2023-08-19 21:07:33 -07:00 · 2023-08-19 21:07:33 -07:00 · d431f16751
commit d431f16751
parent 0e8c46ae08
1 changed file with 5 additions and 1 deletion
--- a/flash_attn/flash_attn_interface.py
+++ b/flash_attn/flash_attn_interface.py
@@ -1,8 +1,12 @@
-import flash_attn_2_cuda as flash_attn_cuda
 import torch
 import torch.nn as nn
 from einops import rearrange
+# isort: off
+# We need to import the CUDA kernels after importing torch
+import flash_attn_2_cuda as flash_attn_cuda
+# isort: on
 def _get_block_size(device, head_dim, is_dropout, is_causal):
    # This should match the block sizes in the CUDA kernel