2024-07-23 16:32:09 +08:00
|
|
|
// Copyright (c) 2024, Tri Dao.
|
2023-07-17 20:26:11 +08:00
|
|
|
// Splitting the different head dimensions to different files to speed up compilation.
|
2023-08-29 04:33:37 +08:00
|
|
|
// This file is auto-generated. See "generate_kernels.py"
|
2023-07-17 20:26:11 +08:00
|
|
|
|
|
|
|
|
#include "flash_fwd_launch_template.h"
|
|
|
|
|
|
2023-08-29 04:33:37 +08:00
|
|
|
template<>
|
2024-07-10 15:24:04 +08:00
|
|
|
void run_mha_fwd_<cutlass::half_t, 96, false>(Flash_fwd_params ¶ms, cudaStream_t stream) {
|
|
|
|
|
run_mha_fwd_hdim96<cutlass::half_t, false>(params, stream);
|
2023-08-29 04:33:37 +08:00
|
|
|
}
|