diff --git a/README.md b/README.md index 0fecdee2..bae618f8 100644 --- a/README.md +++ b/README.md @@ -112,7 +112,7 @@ any Volta-, Turing-, or NVIDIA Ampere- architecture NVIDIA GPU. |NVIDIA A100|8.0|11.0|11.0| |NVIDIA A10 |8.6|11.1|11.1| |NVIDIA GeForce 3090|8.6|11.1|11.1| -|NVIDIA H100 PCIe|9.0|11.8|11.8| +|NVIDIA H100 PCIe|9.0|11.8|Double-precision: 11.8| # Documentation diff --git a/include/cutlass/epilogue/threadblock/epilogue.h b/include/cutlass/epilogue/threadblock/epilogue.h index d334702b..91005832 100644 --- a/include/cutlass/epilogue/threadblock/epilogue.h +++ b/include/cutlass/epilogue/threadblock/epilogue.h @@ -62,7 +62,6 @@ #include "cutlass/epilogue/threadblock/epilogue_base.h" #include "cutlass/epilogue/threadblock/epilogue_base_streamk.h" #include "cutlass/epilogue/threadblock/predicated_tile_iterator.h" -#include "cutlass/util/index_sequence.h" //////////////////////////////////////////////////////////////////////////////// diff --git a/tools/util/include/cutlass/util/reference/host/gemm_complex.h b/tools/util/include/cutlass/util/reference/host/gemm_complex.h index 37221b09..98c7aa5d 100644 --- a/tools/util/include/cutlass/util/reference/host/gemm_complex.h +++ b/tools/util/include/cutlass/util/reference/host/gemm_complex.h @@ -39,6 +39,7 @@ #include "cutlass/numeric_types.h" #include "cutlass/functional.h" #include "cutlass/numeric_conversion.h" +#include "cutlass/matrix_coord.h" #include "cutlass/tensor_view.h" #include "cutlass/gemm/gemm.h"