CUTLASS 2.7 (#318)

CUTLASS 2.7

Mainloop fusion for GEMM: summation over A or B
Strided DGRAD (optimized iterators)
Half-precision GELU_taylor activation functions
Use these when accumulation and epilogue compute types are all cutlass::half_t
Tuning and bug fixes to fused GEMM + GEMM example
Support for smaller than 128b aligned Convolutions: see examples
Caching of results to accelerate Convolution unit tests
Can be enabled or disabled by running cmake .. -DCUTLASS_TEST_ENABLE_CACHED_RESULTS=OFF
Corrections and bug fixes reported by the CUTLASS community
Thank you for filing these issues!

authored-by: Haicheng Wu haichengw@nvidia.com, Manish Gupta manigupta@nvidia.com, Dustyn Blasig dblasig@nvidia.com, Andrew Kerr akerr@nvidia.com
This commit is contained in:
Manish Gupta 2021-09-20 11:02:22 -07:00 committed by GitHub
parent 9ac255863f
commit 2e07c4cc2f
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
62 changed files with 5611 additions and 186 deletions

View File

@ -1,6 +1,16 @@
# NVIDIA CUTLASS Changelog
# CUTLASS 2.x
## [2.7.0](https://github.com/NVIDIA/cutlass/releases/tag/v2.7.0) (2021-09-24)
* Mainloop fusion for GEMM: [summation over A or B](/examples/23_ampere_gemm_operand_reduction_fusion/ampere_gemm_operand_reduction_fusion.cu)
* [Strided DGRAD (optimized iterators)](/include/cutlass/conv/kernel/default_conv2d_dgrad.h)
* [Half-precision GELU_taylor activation functions](/include/cutlass/epilogue/thread/activation.h#L196)
* Use these when accumulation and epilogue compute types are all `cutlass::half_t`
* Tuning and bug fixes to [fused GEMM + GEMM example](/examples/13_two_tensor_op_fusion/)
* Support for smaller than 128b aligned Convolutions: [see examples](test/unit/conv/device/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.cu#L272)
* Caching of results to accelerate Convolution [unit tests](test/unit/conv/device/cache_testbed_output.h)
* Can be enabled or disabled by running `cmake .. -DCUTLASS_TEST_ENABLE_CACHED_RESULTS=OFF`
* Corrections and bug fixes reported by the CUTLASS community
* Thank you for filing these issues!
## [2.6.1](https://github.com/NVIDIA/cutlass/releases/tag/v2.6.1) (2021-09-03)
* Arbitrary padding and striding for CUTLASS Strided DGRAD Convolution operator (Analytic Iterators)

View File

@ -32,7 +32,7 @@ endif()
message(STATUS "CMake Version: ${CMAKE_VERSION}")
project(CUTLASS VERSION 2.6.0 LANGUAGES CXX)
project(CUTLASS VERSION 2.7.0 LANGUAGES CXX)
include(${CMAKE_CURRENT_SOURCE_DIR}/CUDA.cmake)
if (CUDA_VERSION VERSION_LESS 10.2)
@ -188,10 +188,18 @@ set(CUTLASS_LIBRARY_IGNORE_KERNELS "" CACHE STRING "Comma delimited list of kern
# Test Levels L0, L1, L2
set(CUTLASS_TEST_LEVEL "0" CACHE STRING "Level of tests to compile.")
set(CUTLASS_TEST_ENABLE_CACHED_RESULTS ON CACHE BOOL "Enable caching and reuse of test results in unit tests")
set_property(CACHE CUTLASS_TEST_LEVEL PROPERTY STRINGS 0 1 2)
list(APPEND CUTLASS_CUDA_NVCC_FLAGS -DCUTLASS_TEST_LEVEL=${CUTLASS_TEST_LEVEL})
list(APPEND CUTLASS_CUDA_CLANG_FLAGS -DCUTLASS_TEST_LEVEL=${CUTLASS_TEST_LEVEL})
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS)
list(APPEND CUTLASS_CUDA_NVCC_FLAGS -DCUTLASS_TEST_ENABLE_CACHED_RESULTS=1)
endif()
#
# CUDA 10.1 introduces "mma" in PTX performing collective matrix multiply operations.
#
@ -244,7 +252,7 @@ if (NOT MSVC AND CUTLASS_NVCC_KEEP)
# MSVC flow handles caching already, but for other generators we handle it here.
set(CUTLASS_NVCC_KEEP_DIR ${CMAKE_CURRENT_BINARY_DIR}/tmp CACHE PATH "Location to store NVCC scratch files")
file(MAKE_DIRECTORY ${CUTLASS_NVCC_KEEP_DIR})
list(APPEND CUTLASS_CUDA_NVCC_FLAGS --keep) # --keep-dir may not work with nvcc for some directories.
list(APPEND CUTLASS_CUDA_NVCC_FLAGS --keep -v) # --keep-dir may not work with nvcc for some directories.
list(APPEND CUTLASS_CUDA_CLANG_FLAGS -save-temps=${CUTLASS_NVCC_KEEP_DIR})
endif()
@ -572,10 +580,12 @@ function(cutlass_add_executable_tests NAME TARGET)
# TEST_COMMAND_OPTIONS: A list of variables (i.e. by reference params) which contain command line arguments
# to pass to the test executable. A unique test with suffix _0, _1, ... is generated for each set of
# options given. If this option is not used, a single test with no arguments is generated.
# RESULT_CACHE_FILE: A file to be installed alongside the test executable with pre-computed
# test results to speed up test runtime.
#
set(options DISABLE_EXECUTABLE_INSTALL_RULE)
set(oneValueArgs DISABLE_TESTS)
set(oneValueArgs DISABLE_TESTS RESULT_CACHE_FILE)
set(multiValueArgs DEPENDS DEPENDEES TEST_COMMAND_OPTIONS)
cmake_parse_arguments(_ "${options}" "${oneValueArgs}" "${multiValueArgs}" ${ARGN})
@ -583,6 +593,17 @@ function(cutlass_add_executable_tests NAME TARGET)
set(__DISABLE_TESTS OFF)
endif()
if (__RESULT_CACHE_FILE)
add_custom_command(
TARGET ${TARGET}
POST_BUILD
COMMAND ${CMAKE_COMMAND}
ARGS -E copy ${__RESULT_CACHE_FILE} "$<TARGET_FILE_DIR:${TARGET}>"
)
endif()
if (NOT __DISABLE_EXECUTABLE_INSTALL_RULE AND CUTLASS_INSTALL_TESTS)
# file(RELATIVE_PATH CMAKE_CURRENT_BINARY_RELATIVE_DIR ${CMAKE_BINARY_DIR} ${CMAKE_CURRENT_BINARY_DIR})
@ -591,6 +612,15 @@ function(cutlass_add_executable_tests NAME TARGET)
TARGETS ${TARGET}
RUNTIME DESTINATION ${CUTLASS_TEST_INSTALL_BINDIR}
)
if (__RESULT_CACHE_FILE)
install(
FILES ${__RESULT_CACHE_FILE}
DESTINATION ${CUTLASS_TEST_INSTALL_BINDIR}/
)
endif()
endif()

View File

@ -1,15 +1,15 @@
![ALT](/media/images/gemm-hierarchy-with-epilogue-no-labels.png "Complete CUDA GEMM decomposition")
# CUTLASS 2.6
# CUTLASS 2.7
_CUTLASS 2.6.1 - September 2021_
_CUTLASS 2.7 - September 2021_
CUTLASS is a collection of CUDA C++ template abstractions for implementing
high-performance matrix-multiplication (GEMM) at all levels and scales within CUDA.
It incorporates strategies for hierarchical decomposition and data movement similar
to those used to implement cuBLAS. CUTLASS decomposes these "moving parts" into
reusable, modular software components abstracted by C++ template classes. These
thread-wide, warp-wide, block-wide, and device-wide primitives can be specialized
high-performance matrix-multiplication (GEMM) and related computations at all levels
and scales within CUDA. It incorporates strategies for hierarchical decomposition and
data movement similar to those used to implement cuBLAS and cuDNN. CUTLASS decomposes
these "moving parts" into reusable, modular software components abstracted by C++ template
classes. These thread-wide, warp-wide, block-wide, and device-wide primitives can be specialized
and tuned via custom tiling sizes, data types, and other algorithmic policy. The
resulting flexibility simplifies their use as building blocks within custom kernels
and applications.
@ -20,14 +20,14 @@ multiply-accumulate abstractions for half-precision floating
point (FP16), BFloat16 (BF16), Tensor Float 32 (TF32),
single-precision floating point (FP32), double-precision floating
point (FP64) types, integer data types (4b and 8b), and binary data types (1b).
Furthermore, CUTLASS demonstrates warp-synchronous matrix multiply operations
CUTLASS demonstrates warp-synchronous matrix multiply operations
targeting the programmable, high-throughput _Tensor Cores_ implemented by
NVIDIA's Volta, Turing, and Ampere architectures.
Additionaly, CUTLASS implements high-performance convolution (implicit GEMM).
Implicit GEMM is the formulation of a convolution operation as a GEMM. This allows CUTLASS
to build convolutions by reusing highly optimized warp-wide GEMM components and below.
CUTLASS implements high-performance Convolution via the implicit GEMM algorithm.
Implicit GEMM is the formulation of a convolution operation as a GEMM thereby taking advantage of
CUTLASS's modular GEMM pipeline.
This allows CUTLASS to build convolutions by reusing highly optimized warp-wide GEMM components and below.
See the [Quick Start Guide](/media/docs/quickstart.md) to get started quickly.
@ -36,6 +36,16 @@ supported at each level of the execution model hierarchy.
See the [CHANGELOG](CHANGELOG.md) for descriptions of recent updates.
# What's New in CUTLASS 2.7
CUTLASS 2.7 is a minor update to CUTLASS adding:
- Mainloop fusion for GEMM: [summation over A or B](/examples/23_ampere_gemm_operand_reduction_fusion/ampere_gemm_operand_reduction_fusion.cu)
- [Optimizations for strided DGRAD](/include/cutlass/conv/kernel/default_conv2d_dgrad.h)
- [Half-precision GELU_taylor activation functions](/include/cutlass/epilogue/thread/activation.h#L196)
- Tuning and bug fixes to [fused GEMM + GEMM example](/examples/13_two_tensor_op_fusion/)
- Support for smaller than 128b aligned Convolutions: [see examples](test/unit/conv/device/conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.cu#L272)
- Caching of results to accelerate Convolution [unit tests](test/unit/conv/device/cache_testbed_output.h)
- Numerous updates from the community (thanks!)
# What's New in CUTLASS 2.6
CUTLASS 2.6 is a minor update to CUTLASS adding:
- Fused [broadcast](test/unit/gemm/device/gemm_with_broadcast_f16n_f16n_f16n_tensorop_f32_sm75.cu) and [reductions](/test/unit/gemm/device/gemm_with_reduction_f16n_f16n_f16n_tensorop_f32_sm75.cu) in the epilogues of GEMM and Convolution

View File

@ -21,7 +21,7 @@
# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
set(TEST_COMMAND_00 RowMajor --extent=16,16)
set(TEST_COMMAND_01 "ColumnMajorInterleaved<4>" --extent=32,8 --output-shape=16 --vectorize=4)
set(TEST_COMMAND_01 \"ColumnMajorInterleaved<4>\" --extent=32,8 --output-shape=16 --vectorize=4)
cutlass_example_add_executable(
03_visualize_layout

View File

@ -225,6 +225,34 @@ struct global_store;
//
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename AccessType>
struct global_store<AccessType, 64> {
CUTLASS_DEVICE
global_store(AccessType const &D, void *ptr, bool pred_guard) {
uint4 const *data = reinterpret_cast<uint4 const *>(&D);
asm volatile(
"{\n"
" .reg .pred p;\n"
" setp.ne.b32 p, %5, 0;\n"
" @p st.global.v4.u32 [%0], {%1, %2, %3, %4};\n"
" @p st.global.v4.u32 [%6], {%7, %8, %9, %10};\n"
" @p st.global.v4.u32 [%11], {%12, %13, %14, %15};\n"
" @p st.global.v4.u32 [%16], {%17, %18, %19, %20};\n"
"}\n"
:
: "l"(ptr), "r"(data[0].x), "r"(data[0].y), "r"(data[0].z),
"r"(data[0].w), "r"((int)pred_guard), "l"(((uint8_t *)ptr) + 16),
"r"(data[1].x), "r"(data[1].y), "r"(data[1].z), "r"(data[1].w),
"l"(((uint8_t *)ptr) + 32),
"r"(data[2].x), "r"(data[2].y), "r"(data[2].z), "r"(data[2].w),
"l"(((uint8_t *)ptr) + 48),
"r"(data[3].x), "r"(data[3].y), "r"(data[3].z), "r"(data[2].w));
}
};
template <typename AccessType>
struct global_store<AccessType, 32> {
CUTLASS_DEVICE

View File

@ -65,7 +65,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided,
/// Access granularity of A matrix in units of elements
int AlignmentA = 128 / cutlass::sizeof_bits<ElementA>::value,
@ -675,6 +675,243 @@ struct DefaultConv2dDgrad <
>;
};
/// Defines a kernel for Conv2dDgrad specialzation for Optimized IteratorAlgorithm Dgrad Strided and
// multistage pipeline.
template <
typename ElementA,
typename LayoutA,
typename ElementB,
typename LayoutB,
typename ElementC,
typename LayoutC,
typename ElementAccumulator,
typename ArchTag,
typename ThreadblockShape,
typename WarpShape,
typename InstructionShape,
typename EpilogueOutputOp,
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
int AlignmentA,
int AlignmentB
>
struct DefaultConv2dDgrad <
ElementA,
LayoutA,
ElementB,
LayoutB,
ElementC,
LayoutC,
ElementAccumulator,
arch::OpClassTensorOp,
ArchTag,
ThreadblockShape,
WarpShape,
InstructionShape,
EpilogueOutputOp,
ThreadblockSwizzle,
Stages,
MathOperatorTag,
IteratorAlgorithm::kOptimized,
StrideSupport::kStrided,
AlignmentA,
AlignmentB
> {
// Define the core components from GEMM
using MmaCore = typename cutlass::gemm::threadblock::DefaultMmaCore<
ThreadblockShape, WarpShape, InstructionShape, ElementA, layout::RowMajor,
ElementB, layout::RowMajor, ElementAccumulator, layout::RowMajor, arch::OpClassTensorOp,
Stages, MathOperatorTag>;
// Define iterators over tiles from the A operand
using ThreadMapA = typename MmaCore::IteratorThreadMapA;
using AccessTypeA = cutlass::AlignedArray<ElementA, AlignmentA>;
using IteratorA =
cutlass::conv::threadblock::Conv2dDgradOutputGradientTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kM, ThreadblockShape::kK>,
ElementA,
ThreadMapA,
StrideSupport::kStrided,
AccessTypeA
>;
using SmemIteratorA = typename MmaCore::SmemIteratorA;
// Define iterators over tiles from the B operand
using ThreadMapB = typename MmaCore::IteratorThreadMapB;
using AccessTypeB = cutlass::AlignedArray<ElementB, AlignmentB>;
using IteratorB =
cutlass::conv::threadblock::Conv2dDgradFilterTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kK, ThreadblockShape::kN>,
ElementB,
ThreadMapB,
StrideSupport::kStrided,
AccessTypeB
>;
using SmemIteratorB = typename MmaCore::SmemIteratorB;
// Warp-level GEMM components
using WarpMmaTensorOp = typename MmaCore::MmaTensorOp;
using MmaPolicy = typename MmaCore::MmaPolicy;
static cutlass::arch::CacheOperation::Kind const CacheOpB =
((sizeof_bits<ElementB>::value * AlignmentB) == 128)
? cutlass::arch::CacheOperation::Global
: cutlass::arch::CacheOperation::Always;
// Define the Mma
using Mma = threadblock::ImplicitGemmMultistage<
ThreadblockShape,
IteratorA,
SmemIteratorA,
arch::CacheOperation::Always,
IteratorB,
SmemIteratorB,
CacheOpB,
MmaPolicy,
Stages
>;
static const int kPartitionsK = ThreadblockShape::kK / WarpShape::kK;
// Define the epilogue
using Epilogue = typename epilogue::threadblock::DefaultEpilogueTensorOpStridedDgrad<
ThreadblockShape,
WarpMmaTensorOp,
kPartitionsK,
EpilogueOutputOp,
EpilogueOutputOp::kCount
>::Epilogue;
// Define the kernel
using Kernel = cutlass::conv::kernel::ImplicitGemmConvolutionStridedDgrad<
Mma,
Epilogue,
ThreadblockSwizzle,
conv::Operator::kDgrad
>;
};
/// Defines a kernel for Conv2dDgrad specialzation for Optimized IteratorAlgorithm Dgrad Strided
// and 2 stage pipeline.
template <
typename ElementA,
typename LayoutA,
typename ElementB,
typename LayoutB,
typename ElementC,
typename LayoutC,
typename ElementAccumulator,
typename ArchTag,
typename ThreadblockShape,
typename WarpShape,
typename InstructionShape,
typename EpilogueOutputOp,
typename ThreadblockSwizzle,
typename MathOperatorTag,
int AlignmentA,
int AlignmentB
>
struct DefaultConv2dDgrad <
ElementA,
LayoutA,
ElementB,
LayoutB,
ElementC,
LayoutC,
ElementAccumulator,
arch::OpClassTensorOp,
ArchTag,
ThreadblockShape,
WarpShape,
InstructionShape,
EpilogueOutputOp,
ThreadblockSwizzle,
2,
MathOperatorTag,
IteratorAlgorithm::kOptimized,
StrideSupport::kStrided,
AlignmentA,
AlignmentB
> {
// Define the core components from GEMM
using MmaCore = typename cutlass::gemm::threadblock::DefaultMmaCore<
ThreadblockShape, WarpShape, InstructionShape, ElementA, layout::RowMajor,
ElementB, layout::RowMajor, ElementAccumulator, layout::RowMajor, arch::OpClassTensorOp,
2, MathOperatorTag>;
// Define iterators over tiles from the A operand
using ThreadMapA = typename MmaCore::IteratorThreadMapA;
using AccessTypeA = cutlass::AlignedArray<ElementA, AlignmentA>;
using IteratorA =
cutlass::conv::threadblock::TileIteratorStridedDgrad<
cutlass::conv::threadblock::Conv2dDgradOutputGradientTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kM, ThreadblockShape::kK>,
ElementA,
ThreadMapA,
StrideSupport::kStrided,
AccessTypeA
>
>;
using SmemIteratorA = typename MmaCore::SmemIteratorA;
// Define iterators over tiles from the B operand
using ThreadMapB = typename MmaCore::IteratorThreadMapB;
using AccessTypeB = cutlass::AlignedArray<ElementB, AlignmentB>;
using IteratorB =
cutlass::conv::threadblock::TileIteratorStridedDgrad<
cutlass::conv::threadblock::Conv2dDgradFilterTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kK, ThreadblockShape::kN>,
ElementB,
ThreadMapB,
StrideSupport::kStrided,
AccessTypeB
>
>;
using SmemIteratorB = typename MmaCore::SmemIteratorB;
// Warp-level GEMM components
using WarpMmaTensorOp = typename MmaCore::MmaTensorOp;
using MmaPolicy = typename MmaCore::MmaPolicy;
// Define the Mma
using Mma = threadblock::ImplicitGemmPipelined<
ThreadblockShape,
IteratorA,
SmemIteratorA,
IteratorB,
SmemIteratorB,
ElementC,
LayoutC,
MmaPolicy
>;
static const int kPartitionsK = ThreadblockShape::kK / WarpShape::kK;
// Define the epilogue
using Epilogue = typename detail::DefaultConvEpilogueStridedDgrad<
ArchTag,
ThreadblockShape,
WarpMmaTensorOp,
kPartitionsK,
EpilogueOutputOp
>::Epilogue;
// Define the kernel
using Kernel = cutlass::conv::kernel::ImplicitGemmConvolutionStridedDgrad<
Mma,
Epilogue,
ThreadblockSwizzle,
conv::Operator::kDgrad
>;
};
/// Defines a kernel for Conv2dDgrad specialzation for Optimized IteratorAlgorithm Dgrad Unity
// 2 stage pipeline
template <
@ -1126,6 +1363,112 @@ struct DefaultConv2dDgrad <
};
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA,
typename LayoutA,
typename ElementB,
typename LayoutB,
typename ElementC,
typename LayoutC,
typename ElementAccumulator,
typename ArchTag,
typename ThreadblockShape,
typename WarpShape,
typename InstructionShape,
typename EpilogueOutputOp,
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
int AlignmentA,
int AlignmentB
>
struct DefaultConv2dDgrad <
ElementA,
LayoutA,
ElementB,
LayoutB,
ElementC,
LayoutC,
ElementAccumulator,
arch::OpClassSimt,
ArchTag,
ThreadblockShape,
WarpShape,
InstructionShape,
EpilogueOutputOp,
ThreadblockSwizzle,
Stages,
MathOperatorTag,
IteratorAlgorithm::kOptimized,
conv::StrideSupport::kStrided,
AlignmentA,
AlignmentB
> {
// Define the core components from GEMM
using MmaCore = typename cutlass::gemm::threadblock::DefaultMmaCore<
ThreadblockShape, WarpShape, InstructionShape, ElementA, layout::RowMajor,
ElementB, layout::RowMajor, ElementAccumulator, layout::RowMajor, arch::OpClassSimt,
Stages, MathOperatorTag>;
// Define iterators over tiles from the A operand
using ThreadMapA = typename MmaCore::IteratorThreadMapA;
using IteratorA =
cutlass::conv::threadblock::Conv2dDgradOutputGradientTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kM, ThreadblockShape::kK>,
ElementA,
ThreadMapA,
conv::StrideSupport::kStrided
>;
using SmemIteratorA = typename MmaCore::SmemIteratorA;
// Define iterators over tiles from the B operand
using ThreadMapB = typename MmaCore::IteratorThreadMapB;
using IteratorB =
cutlass::conv::threadblock::Conv2dDgradFilterTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kK, ThreadblockShape::kN>,
ElementB,
ThreadMapB,
conv::StrideSupport::kStrided
>;
using SmemIteratorB = typename MmaCore::SmemIteratorB;
// Warp-level GEMM components
using WarpMmaSimtOp = typename MmaCore::MmaWarpSimt;
using MmaPolicy = typename MmaCore::MmaPolicy;
// Define the Mma
using Mma = threadblock::ImplicitGemmMultistage<
ThreadblockShape,
IteratorA,
SmemIteratorA,
arch::CacheOperation::Always,
IteratorB,
SmemIteratorB,
arch::CacheOperation::Always,
MmaPolicy,
Stages
>;
// Define the epilogue
using Epilogue = typename epilogue::threadblock::DefaultEpilogueSimtStridedDgrad<
ThreadblockShape,
WarpMmaSimtOp,
EpilogueOutputOp,
EpilogueOutputOp::kCount
>::Epilogue;
// Define the kernel
using Kernel = cutlass::conv::kernel::ImplicitGemmConvolutionStridedDgrad<
Mma,
Epilogue,
ThreadblockSwizzle,
conv::Operator::kDgrad
>;
};
/////////////////////////////////////////////////////////////////////////////////////////////////
/// Defines a kernel for Conv2dDgrad specialzation for Analytic IteratorAlgorithm,
@ -1462,6 +1805,115 @@ struct DefaultConv2dDgrad <
};
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA,
typename LayoutA,
typename ElementB,
typename LayoutB,
typename ElementC,
typename LayoutC,
typename ElementAccumulator,
typename ArchTag,
typename ThreadblockShape,
typename WarpShape,
typename InstructionShape,
typename EpilogueOutputOp,
typename ThreadblockSwizzle,
typename MathOperatorTag,
int AlignmentA,
int AlignmentB
>
struct DefaultConv2dDgrad <
ElementA,
LayoutA,
ElementB,
LayoutB,
ElementC,
LayoutC,
ElementAccumulator,
arch::OpClassSimt,
ArchTag,
ThreadblockShape,
WarpShape,
InstructionShape,
EpilogueOutputOp,
ThreadblockSwizzle,
2,
MathOperatorTag,
IteratorAlgorithm::kOptimized,
conv::StrideSupport::kStrided,
AlignmentA,
AlignmentB
> {
// Define the core components from GEMM
using MmaCore = typename cutlass::gemm::threadblock::DefaultMmaCore<
ThreadblockShape, WarpShape, InstructionShape, ElementA, layout::RowMajor,
ElementB, layout::RowMajor, ElementAccumulator, layout::RowMajor, arch::OpClassSimt,
2, MathOperatorTag>;
// Define iterators over tiles from the A operand
using ThreadMapA = typename MmaCore::IteratorThreadMapA;
using IteratorA =
cutlass::conv::threadblock::TileIteratorStridedDgrad<
cutlass::conv::threadblock::Conv2dDgradOutputGradientTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kM, ThreadblockShape::kK>,
ElementA,
ThreadMapA,
conv::StrideSupport::kStrided
>
>;
using SmemIteratorA = typename MmaCore::SmemIteratorA;
// Define iterators over tiles from the B operand
using ThreadMapB = typename MmaCore::IteratorThreadMapB;
using IteratorB =
cutlass::conv::threadblock::TileIteratorStridedDgrad<
cutlass::conv::threadblock::Conv2dDgradFilterTileAccessIteratorOptimized<
cutlass::MatrixShape<ThreadblockShape::kK, ThreadblockShape::kN>,
ElementB,
ThreadMapB,
conv::StrideSupport::kStrided
>
>;
using SmemIteratorB = typename MmaCore::SmemIteratorB;
// Warp-level GEMM components
using WarpMmaSimtOp = typename MmaCore::MmaWarpSimt;
using MmaPolicy = typename MmaCore::MmaPolicy;
// Define the Mma
using Mma = threadblock::ImplicitGemmPipelined<
ThreadblockShape,
IteratorA,
SmemIteratorA,
IteratorB,
SmemIteratorB,
ElementC,
LayoutC,
MmaPolicy
>;
// Define the epilogue
using Epilogue = typename epilogue::threadblock::DefaultEpilogueSimtStridedDgrad<
ThreadblockShape,
WarpMmaSimtOp,
EpilogueOutputOp,
EpilogueOutputOp::kCount
>::Epilogue;
// Define the kernel
using Kernel = cutlass::conv::kernel::ImplicitGemmConvolutionStridedDgrad<
Mma,
Epilogue,
ThreadblockSwizzle,
conv::Operator::kDgrad
>;
};
} // namespace kernel
} // namespace conv
} // namespace cutlass

View File

@ -65,7 +65,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided,
/// Access granularity of A matrix in units of elements
int AlignmentA = 128 / cutlass::sizeof_bits<ElementA>::value,

View File

@ -64,7 +64,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided,
/// Access granularity of A matrix in units of elements
int AlignmentA = 128 / cutlass::sizeof_bits<ElementA>::value,

View File

@ -65,7 +65,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided,
/// Access granularity of A matrix in units of elements
int AlignmentA = 128 / cutlass::sizeof_bits<ElementA>::value,

View File

@ -66,7 +66,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided,
/// Access granularity of A matrix in units of elements
int AlignmentA = 128 / cutlass::sizeof_bits<ElementA>::value,

View File

@ -66,7 +66,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided
> struct DefaultConv3dDgrad;

View File

@ -66,7 +66,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided
> struct DefaultConv3dFprop;

View File

@ -65,7 +65,7 @@ template <
typename ThreadblockSwizzle,
int Stages,
typename MathOperatorTag,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kAnalytic,
conv::IteratorAlgorithm IteratorAlgorithm = IteratorAlgorithm::kOptimized,
conv::StrideSupport StrideSupport = StrideSupport::kStrided
> struct DefaultConv3dWgrad;

View File

@ -210,9 +210,9 @@ public:
CUTLASS_HOST_DEVICE
TensorCoord at() const {
int c = offset_c_[iteration_contiguous_];
int k = offset_k_[iteration_strided_];
int c = offset_c_[iteration_contiguous_] + iteration_vector_ * AccessType::kElements;
return TensorCoord(k, filter_r_, filter_s_, c);
}
@ -222,7 +222,7 @@ public:
TensorCoord coord = at();
return coord.n() < problem_size_.K && (coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.C;
return coord.n() < problem_size_.K && coord.c() < problem_size_.C;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -232,7 +232,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
}
@ -250,6 +250,7 @@ public:
return *this;
}
iteration_contiguous_ = 0;
++iteration_strided_;
if (iteration_strided_ < ThreadMap::Iterations::kStrided) {
return *this;
@ -408,8 +409,8 @@ public:
CUTLASS_HOST_DEVICE
TensorCoord at() const {
int c = offset_c_[iteration_contiguous_];
int k = offset_k_[iteration_strided_];
int c = offset_c_[iteration_contiguous_] + iteration_vector_ * AccessType::kElements;
return TensorCoord(k, filter_r_, filter_s_, c);
}
@ -420,7 +421,7 @@ public:
TensorCoord coord = at();
return coord.n() < problem_size_.K && (coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.C;
return coord.n() < problem_size_.K && coord.c() < problem_size_.C;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -430,7 +431,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
}
/// Increments to the next memory access

View File

@ -67,6 +67,282 @@ class Conv2dDgradFilterTileAccessIteratorOptimized;
/////////////////////////////////////////////////////////////////////////////////////////////////
// Conv2dDgradFilterTileAccessIteratorOptimized unity strided dgrad is more performant for dgrad
// on problem sizes with stride = {1x1}
template <
typename Shape_,
typename Element_,
typename ThreadMap_,
typename AccessType_
>
class Conv2dDgradFilterTileAccessIteratorOptimized <
Shape_,
Element_,
ThreadMap_,
conv::StrideSupport::kStrided,
AccessType_
> {
public:
//
// Types
//
using Shape = Shape_;
using Element = Element_;
using Layout = layout::TensorNHWC;
using ThreadMap = ThreadMap_;
using AccessType = AccessType_;
using TensorRef = cutlass::TensorRef<Element, Layout>;
using TensorCoord = typename Layout::TensorCoord;
using Index = typename Layout::Index;
using LongIndex = typename Layout::LongIndex;
static IteratorAlgorithm const kIteratorAlgorithm = conv::IteratorAlgorithm::kOptimized;
static StrideSupport const kStrideSupport = conv::StrideSupport::kStrided;
static int const kConvDim = 2;
using ConvProblemSize = typename conv::Conv2dProblemSize;
static int const kAccessesPerVector = ThreadMap::kElementsPerAccess / AccessType::kElements;
static_assert(!(ThreadMap::kElementsPerAccess % AccessType::kElements),
"Vectors implied by the thread map must be divisible by the access type.");
//
// Parameters structure
//
struct Params : Conv2dStridedDgradFilterIteratorOptimizedParams {
//
// Methods
//
CUTLASS_HOST_DEVICE
Params() { }
CUTLASS_HOST_DEVICE
Params(Conv2dStridedDgradFilterIteratorOptimizedParams const &base):
Conv2dStridedDgradFilterIteratorOptimizedParams(base) { }
CUTLASS_HOST_DEVICE
Params(
Conv2dProblemSize const &problem_size,
Layout const &layout
):
Conv2dStridedDgradFilterIteratorOptimizedParams(
problem_size,
layout,
sizeof_bits<Element>::value,
{Shape::kRow, Shape::kColumn},
ThreadMap::kThreads,
ThreadMap::kElementsPerAccess,
{ThreadMap::Iterations::kContiguous, ThreadMap::Iterations::kStrided},
{ThreadMap::Delta::kContiguous, ThreadMap::Delta::kStrided}
) { }
};
private:
Conv2dStridedDgradFilterIteratorOptimizedParams const &params_;
Conv2dProblemSize const &problem_size_;
LongIndex iteration_contiguous_;
LongIndex iteration_strided_;
LongIndex iteration_vector_;
char const *pointer_;
uint32_t predicates_[kAccessesPerVector];
int filter_k_;
int filter_r_;
int filter_s_;
int start_r_;
int start_s_;
int64_t reset_bytes_s_;
int64_t reset_bytes_r_;
//
// Assertions
//
// We map predicates into bits packed in this uint32_t container
static_assert(ThreadMap::Iterations::kStrided *
ThreadMap::Iterations::kContiguous < sizeof(predicates_) * 8,
"Currently, the number of loads per iteration is limited by the size of the predicates container.");
public:
CUTLASS_HOST_DEVICE
Conv2dDgradFilterTileAccessIteratorOptimized(
Conv2dStridedDgradFilterIteratorOptimizedParams const &params,
Conv2dProblemSize const &problem_size,
Element const *ptr,
int thread_idx,
int start_r, int start_s,
MatrixCoord const &threadblock_offset = MatrixCoord()
):
params_(params),
problem_size_(problem_size),
pointer_(reinterpret_cast<char const *>(ptr)),
predicates_{0},
filter_r_(start_r),
filter_s_(start_s),
start_r_(start_r),
start_s_(start_s) {
layout::PitchLinearCoord thread_coord = ThreadMap::initial_offset(thread_idx);
filter_k_ = threadblock_offset.row() + thread_coord.strided();
Index column = threadblock_offset.column() + thread_coord.contiguous();
reset_bytes_s_ = (problem_size_.num_gemm_k_filter_s(start_s_) - 1) * params_.inc_next[0];
reset_bytes_r_ = reset_bytes_s_ +
(problem_size_.num_gemm_k_filter_r(start_r_) - 1) * params_.inc_next[1];
CUTLASS_PRAGMA_UNROLL
for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) {
CUTLASS_PRAGMA_UNROLL
for (int c = 0; c < ThreadMap::Iterations::kContiguous; ++c) {
int filter_k = filter_k_ + s * ThreadMap::Delta::kStrided;
int filter_c = column + c * ThreadMap::Delta::kContiguous;
CUTLASS_PRAGMA_UNROLL
for (int v = 0; v < kAccessesPerVector; ++v) {
uint32_t pred = ((filter_k < problem_size_.K && (filter_c + v * AccessType::kElements) < problem_size_.C) ? 1u : 0);
int pred_idx = c + s * ThreadMap::Iterations::kContiguous;
predicates_[v] |= (pred << pred_idx);
}
}
}
TensorCoord coord{filter_k_, filter_r_, filter_s_, column};
pointer_ += params_.layout(coord) * sizeof_bits<Element>::value / 8;
set_iteration_index(0);
}
/// Overrides the internal iteration index
CUTLASS_HOST_DEVICE
void set_iteration_index(Index index) {
iteration_vector_ = index % kAccessesPerVector;
int residual_access = index / kAccessesPerVector;
iteration_contiguous_ = residual_access % ThreadMap::Iterations::kContiguous;
iteration_strided_ = residual_access / ThreadMap::Iterations::kContiguous;
}
/// Adds a pointer offset in units of Element
CUTLASS_HOST_DEVICE
void add_pointer_offset(LongIndex pointer_offset) {
pointer_ += pointer_offset * sizeof_bits<Element>::value / 8;
}
CUTLASS_HOST_DEVICE
void advance() {
int next_idx = 0;
LongIndex reset_bytes = params_.reset_bytes;
// Move filter_s by stride_w
filter_s_ += problem_size_.stride_w;
if (filter_s_ >= problem_size_.S) {
// Restore filter_s
filter_s_ = start_s_;
// Move filter_r by stride_h
filter_r_ += problem_size_.stride_h;
bool check = (filter_r_ < problem_size_.R);
filter_r_ = check ? filter_r_ : start_r_;
next_idx = check ? 1 : 2;
reset_bytes += (check ? reset_bytes_s_ : reset_bytes_r_);
}
// offset pointers by offset_bytes
pointer_ += (params_.inc_next[next_idx] - reset_bytes);
if (next_idx == 2) {
filter_k_ += params_.filter_k_delta;
}
// Clear predicates if needed
CUTLASS_PRAGMA_UNROLL
for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) {
if (filter_k_ + s * ThreadMap::Delta::kStrided >= problem_size_.K) {
uint32_t kClearMask = ((1u << ThreadMap::Iterations::kContiguous) - 1) << (s * ThreadMap::Iterations::kContiguous);
CUTLASS_PRAGMA_UNROLL
for (int v = 0; v < kAccessesPerVector; ++v) {
predicates_[v] = (predicates_[v] & (~kClearMask));
}
}
}
}
/// Returns true if the current coordinate is within the filter tensor W
CUTLASS_HOST_DEVICE
bool valid() {
LongIndex pred_idx = iteration_contiguous_ + iteration_strided_ * ThreadMap::Iterations::kContiguous;
return (predicates_[iteration_vector_] & (1u << pred_idx));
}
/// Returns a pointer to the vector starting at the current coordinate
CUTLASS_HOST_DEVICE
AccessType const *get() const {
return reinterpret_cast<AccessType const *>(pointer_ +
iteration_contiguous_ * ThreadMap::Delta::kContiguous * sizeof_bits<Element>::value / 8) + iteration_vector_;
}
/// Increments to the next memory access
CUTLASS_HOST_DEVICE
Conv2dDgradFilterTileAccessIteratorOptimized &operator++() {
++iteration_vector_;
if (iteration_vector_ < kAccessesPerVector) {
return *this;
}
iteration_vector_ = 0;
++iteration_contiguous_;
if (iteration_contiguous_ < ThreadMap::Iterations::kContiguous) {
return *this;
}
iteration_contiguous_ = 0;
++iteration_strided_;
if (iteration_strided_ < ThreadMap::Iterations::kStrided) {
// Move to the next K coordinate within the tile
pointer_ += params_.inc_next_strided;
return *this;
}
iteration_strided_ = 0;
return *this;
}
/// Determines whether the Implicit GEMM can execute the given problem.
CUTLASS_HOST_DEVICE
static Status can_implement(Conv2dProblemSize const &problem_size) {
// check alignment constraint on iterator's contiguous dimension
if (problem_size.C % AccessType::kElements) {
return Status::kErrorInvalidProblem;
}
return Status::kSuccess;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
// Conv2dDgradFilterTileAccessIteratorOptimized unity strided dgrad is more performant for dgrad
// on problem sizes with stride = {1x1}
template <

View File

@ -268,11 +268,13 @@ public:
p += (conv_sign * (filter_r_ / problem_size_.stride_h));
q += (conv_sign * (filter_s_ / problem_size_.stride_w));
int k = filter_k_ + iteration_vector_ * AccessType::kElements;
return TensorCoord(
n,
p,
q,
filter_k_);
k);
}
@ -286,7 +288,7 @@ public:
coord.n() < problem_size_.N &&
coord.h() >= 0 && coord.h() < problem_size_.P &&
coord.w() >= 0 && coord.w() < problem_size_.Q &&
(coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.K;
coord.c() < problem_size_.K;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -296,7 +298,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
}
/// Increments to the next memory access
@ -313,6 +315,7 @@ public:
return *this;
}
iteration_contiguous_ = 0;
++iteration_strided_;
if (iteration_strided_ < ThreadMap::Iterations::kStrided) {
return *this;
@ -516,7 +519,9 @@ public:
int p = (h + problem_size_.pad_h - r * problem_size_.dilation_h) / problem_size_.stride_h;
int q = (w + problem_size_.pad_w - s * problem_size_.dilation_w) / problem_size_.stride_w;
return TensorCoord(n, p, q, filter_k_);
int k = filter_k_ + iteration_vector_ * AccessType::kElements;
return TensorCoord(n, p, q, k);
}
@ -529,7 +534,7 @@ public:
return coord.n() < problem_size_.N &&
coord.h() >= 0 && coord.h() < problem_size_.P &&
coord.w() >= 0 && coord.w() < problem_size_.Q &&
(coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.K;
coord.c() < problem_size_.K;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -539,7 +544,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
}
/// Increments to the next memory access

View File

@ -67,6 +67,380 @@ template <
class Conv2dDgradOutputGradientTileAccessIteratorOptimized;
/////////////////////////////////////////////////////////////////////////////////////////////////
/////////////////////////////////////////////////////////////////////////////////////////////////
// Conv2dDgradOutputGradientTileAccessIteratorOptimized strided dgrad needs special handling
// to skip MMAs (Dx = Dy * w) on invalid filter positions
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename Shape_,
typename Element_,
typename ThreadMap_,
typename AccessType_
>
class Conv2dDgradOutputGradientTileAccessIteratorOptimized <
Shape_,
Element_,
ThreadMap_,
conv::StrideSupport::kStrided,
AccessType_
> {
public:
//
// Types
//
using Shape = Shape_;
using Element = Element_;
using Layout = layout::TensorNHWC;
using ThreadMap = ThreadMap_;
using AccessType = AccessType_;
using TensorRef = cutlass::TensorRef<Element, Layout>;
using TensorCoord = typename Layout::TensorCoord;
using Index = typename Layout::Index;
using LongIndex = typename Layout::LongIndex;
static IteratorAlgorithm const kIteratorAlgorithm = conv::IteratorAlgorithm::kOptimized;
static StrideSupport const kStrideSupport = conv::StrideSupport::kStrided;
static int const kConvDim = 2;
using ConvProblemSize = typename conv::Conv2dProblemSize;
static int const kAccessesPerVector = ThreadMap::kElementsPerAccess / AccessType::kElements;
static_assert(!(ThreadMap::kElementsPerAccess % AccessType::kElements),
"Vectors implied by the thread map must be divisible by the access type.");
using Mask = uint64_t;
static_assert(sizeof_bits<Element>::value >= 8,
"DGRAD requires elements of size 8b or greater.");
//
// Simpligying assertions
//
static_assert(ThreadMap::Iterations::kContiguous == 1,
"Require Iterations::kContiguous == 1");
//
// Parameters structure
//
using Params = Conv2dStridedDgradOutputGradientIteratorOptimizedParams;
private:
Params const &params_;
Conv2dProblemSize const &problem_size_;
LongIndex iteration_contiguous_;
LongIndex iteration_strided_;
LongIndex iteration_vector_;
// One pointer per access
char const *pointer_[ThreadMap::Iterations::kStrided];
int filter_k_;
int filter_r_;
int filter_s_;
int start_r_;
int start_s_;
int64_t reset_bytes_s_;
int64_t reset_bytes_r_;
Index masks_[ThreadMap::Iterations::kStrided][kAccessesPerVector][2];
public:
CUTLASS_HOST_DEVICE
Conv2dDgradOutputGradientTileAccessIteratorOptimized(
Params const &params,
Conv2dProblemSize const &problem_size,
Element const *ptr,
int thread_idx,
FastDivmod const &stride_h_divmod, FastDivmod const &stride_w_divmod,
int start_r, int start_s,
MatrixCoord const &threadblock_offset = MatrixCoord() // threadblock offset - units are whole CTA tiles
):
params_(params),
problem_size_(problem_size),
filter_k_(0),
filter_r_(start_r),
filter_s_(start_s),
start_r_(start_r),
start_s_(start_s) {
layout::PitchLinearCoord thread_coord = ThreadMap::initial_offset(thread_idx);
filter_k_ = threadblock_offset.column() + thread_coord.contiguous();
reset_bytes_s_ = (problem_size_.num_gemm_k_filter_s(start_s_) - 1) * params_.inc_next[0];
reset_bytes_r_ = (problem_size_.num_gemm_k_filter_s(start_s_) - 1) * params_.inc_next[0] +
(problem_size_.num_gemm_k_filter_r(start_r_) - 1) * params_.inc_next[1];
int offset_n[ThreadMap::Iterations::kStrided];
int offset_p[ThreadMap::Iterations::kStrided];
int offset_q[ThreadMap::Iterations::kStrided];
int filter_r = filter_r_;
int filter_s = filter_s_;
if (problem_size_.mode == Mode::kConvolution) {
filter_r = (problem_size_.R - 1 - filter_r);
filter_s = (problem_size_.S - 1 - filter_s);
}
// Starting h, w positions for filter position in gemm_k=0
int start_h, start_w;
strided_dgrad_starting_coords(
problem_size_,
stride_h_divmod, stride_w_divmod,
filter_r, filter_s,
start_h, start_w);
// Effective starting P and Q for filter position required for remapping NHW rows
int P = (problem_size_.H - start_h + problem_size_.stride_h - 1) / problem_size_.stride_h;
int Q = (problem_size_.W - start_w + problem_size_.stride_w - 1) / problem_size_.stride_w;
CUTLASS_PRAGMA_UNROLL
for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) {
pointer_[s] = reinterpret_cast<char const *>(ptr);
int offset_npq = (threadblock_offset.row() + thread_coord.strided() + s * ThreadMap::Delta::kStrided) % params_.tiled_rows_per_filter;
// (STEP 1) [reorder NHW rows to start with same filter positions]
offset_n[s] = offset_npq / (P * Q);
int residual = offset_npq % (P * Q);
int p = (residual / Q);
int q = (residual % Q);
int mapped_h = (start_h + p * problem_size_.stride_h);
int mapped_w = (start_w + q * problem_size_.stride_w);
// Access (p, q) coordinates for Dy tensor for filter position in gemm_k=0
// note that (h + pad_h - filter_r) and (w + pad_w - filter_s) are ensured to be
// divisible by stride_h and stride_w
offset_p[s] = (mapped_h + problem_size_.pad_h - filter_r) / problem_size_.stride_h;
offset_q[s] = (mapped_w + problem_size_.pad_w - filter_s) / problem_size_.stride_w;
// Intialize pointers for gemm_k=0
TensorCoord coord{offset_n[s], offset_p[s], offset_q[s], filter_k_};
pointer_[s] += params_.layout(coord) * sizeof_bits<Element>::value / 8;
}
//
// Precompute mask predicates
//
clear_mask();
CUTLASS_PRAGMA_NO_UNROLL
for (int r = start_r; r < problem_size_.R; r += problem_size_.stride_h) {
CUTLASS_PRAGMA_UNROLL
for (int s_idx = 0; s_idx < ThreadMap::Iterations::kStrided; ++s_idx) {
int p = offset_p[s_idx] ;
p += (params_.conv_sign * (r / problem_size_.stride_h));
bool pred = (offset_n[s_idx] < problem_size_.N && p >= 0 && p < problem_size_.P);
CUTLASS_PRAGMA_UNROLL
for (int v_idx = 0; v_idx < kAccessesPerVector; ++v_idx) {
masks_[s_idx][v_idx][0] |= (pred << r);
}
}
}
CUTLASS_PRAGMA_NO_UNROLL
for(int s = start_s; s < problem_size_.S; s += problem_size_.stride_w) {
CUTLASS_PRAGMA_UNROLL
for (int s_idx = 0; s_idx < ThreadMap::Iterations::kStrided; ++s_idx) {
int q = offset_q[s_idx];
q += (params_.conv_sign * (s / problem_size_.stride_w));
bool pred = (q >=0 && q < problem_size_.Q);
CUTLASS_PRAGMA_UNROLL
for (int v_idx = 0; v_idx < kAccessesPerVector; ++v_idx) {
masks_[s_idx][v_idx][1] |= (pred << s);
}
}
}
CUTLASS_PRAGMA_UNROLL
for (int v_idx = 0; v_idx < kAccessesPerVector; ++v_idx) {
clear_mask(v_idx, (filter_k_ + v_idx * AccessType::kElements) >= problem_size.K);
}
set_iteration_index(0);
}
CUTLASS_HOST_DEVICE
static Params getParams(Conv2dProblemSize const &problem_size, Layout const &layout) {
return Params(problem_size,
layout,
sizeof_bits<Element>::value,
{Shape::kRow, Shape::kColumn});
}
private:
/// Adds a pointer offset in units of element
CUTLASS_HOST_DEVICE
void add_byte_offset_(LongIndex byte_offset, LongIndex byte_reset = 0) {
CUTLASS_PRAGMA_UNROLL
for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) {
pointer_[s] += byte_offset - byte_reset;
}
}
public:
/// Overrides the internal iteration index
CUTLASS_HOST_DEVICE
void set_iteration_index(Index index) {
iteration_vector_ = index % kAccessesPerVector;
int residual_access = index / kAccessesPerVector;
iteration_contiguous_ = residual_access % ThreadMap::Iterations::kContiguous;
iteration_strided_ = residual_access / ThreadMap::Iterations::kContiguous;
}
/// Adds a pointer offset in units of Element
CUTLASS_HOST_DEVICE
void add_pointer_offset(LongIndex pointer_offset) {
add_byte_offset_(pointer_offset * sizeof_bits<Element>::value / 8);
}
CUTLASS_HOST_DEVICE
void advance() {
int next_idx = 0;
int64_t reset_bytes = 0;
// Move filter_s by stride_w
filter_s_ += problem_size_.stride_w;
if (filter_s_ >= problem_size_.S) {
// Restore filter_s
filter_s_ = start_s_;
// Move filter_r by stride_h
filter_r_ += problem_size_.stride_h;
if (filter_r_ < problem_size_.R) {
next_idx = 1;
// Restore bytes in q coordinate (Mma in filter s dimenstion)
reset_bytes = reset_bytes_s_;
} else {
// Restore filter_r
filter_r_ = start_r_;
next_idx = 2;
// Restore bytes in p and q coordinate (Mma in filter s and r dimenstion)
reset_bytes = reset_bytes_r_;
}
}
// offset pointers by offset_bytes
add_byte_offset_(params_.inc_next[next_idx] - reset_bytes);
if (next_idx == 2) {
filter_k_ += params_.filter_k_delta;
}
CUTLASS_PRAGMA_UNROLL
for (int v_idx = 0; v_idx < kAccessesPerVector; ++v_idx) {
clear_mask(v_idx, (filter_k_ + v_idx * AccessType::kElements) >= problem_size_.K);
}
}
/// Clears the predicates
CUTLASS_HOST_DEVICE
void clear_mask(bool clear = true) {
CUTLASS_PRAGMA_UNROLL
for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) {
CUTLASS_PRAGMA_UNROLL
for (int v = 0; v < kAccessesPerVector; ++v) {
masks_[s][v][0] = clear ? Mask(0) : masks_[s][v][0];
masks_[s][v][1] = clear ? Mask(0) : masks_[s][v][1];
}
}
}
/// Clears the predicates
CUTLASS_HOST_DEVICE
void clear_mask(int v, bool clear = true) {
CUTLASS_PRAGMA_UNROLL
for (int s = 0; s < ThreadMap::Iterations::kStrided; ++s) {
masks_[s][v][0] = clear ? Mask(0) : masks_[s][v][0];
masks_[s][v][1] = clear ? Mask(0) : masks_[s][v][1];
}
}
/// Returns true if the current coordinate is within the output tensor Dy
CUTLASS_HOST_DEVICE
bool valid() const {
return
(masks_[iteration_strided_][iteration_vector_][0] & (Index(1) << filter_r_)) &&
(masks_[iteration_strided_][iteration_vector_][1] & (Index(1) << filter_s_));
}
/// Returns a pointer to the vector starting at the current coordinate
CUTLASS_HOST_DEVICE
AccessType const *get() const {
return reinterpret_cast<AccessType const *>(pointer_[iteration_strided_]) + iteration_vector_;
}
/// Increments to the next memory access
CUTLASS_HOST_DEVICE
Conv2dDgradOutputGradientTileAccessIteratorOptimized &operator++() {
++iteration_vector_;
if (iteration_vector_ < kAccessesPerVector) {
return *this;
}
iteration_vector_ = 0;
++iteration_contiguous_;
if (iteration_contiguous_ < ThreadMap::Iterations::kContiguous) {
return *this;
}
iteration_contiguous_ = 0;
++iteration_strided_;
if (iteration_strided_ < ThreadMap::Iterations::kStrided) {
return *this;
}
iteration_strided_ = 0;
return *this;
}
/// Determines whether the Implicit GEMM can execute the given problem.
CUTLASS_HOST_DEVICE
static Status can_implement(Conv2dProblemSize const &problem_size) {
// check alignment constraint on iterator's contiguous dimension
if (problem_size.K % AccessType::kElements) {
return Status::kErrorInvalidProblem;
}
// Limit on filter size
if (problem_size.R > 32 || problem_size.S > 32) {
return Status::kErrorNotSupported;
}
return Status::kSuccess;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
// Conv2dDgradOutputGradientTileAccessIteratorOptimized unity stride dgrad is optimized for dgrad
// with problem stride = {1x1}

View File

@ -209,7 +209,9 @@ public:
int h = p * problem_size_.stride_h - problem_size_.pad_h + r * problem_size_.dilation_h;
int w = q * problem_size_.stride_w - problem_size_.pad_w + s * problem_size_.dilation_w;
return TensorCoord(n, h, w, filter_c_);
int c = filter_c_ + iteration_vector_ * AccessType::kElements;
return TensorCoord(n, h, w, c);
}
/// Returns true if the current coordinate is within the activations tensor X
@ -221,7 +223,7 @@ public:
return coord.n() < problem_size_.N &&
coord.h() >= 0 && coord.h() < problem_size_.H &&
coord.w() >= 0 && coord.w() < problem_size_.W &&
(coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.C;
coord.c() < problem_size_.C;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -231,7 +233,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
AccessType const *ptr = reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
AccessType const *ptr = reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
return ptr;
}

View File

@ -183,8 +183,9 @@ public:
TensorCoord at() const {
int k = offset_k_[iteration_strided_];
int c = filter_c_ + iteration_vector_ * AccessType::kElements;
return TensorCoord(k, filter_r_, filter_s_, filter_c_);
return TensorCoord(k, filter_r_, filter_s_, c);
}
/// Returns true if the current coordinate is within the activations tensor W
@ -194,7 +195,7 @@ public:
TensorCoord coord = at();
return coord.n() < problem_size_.K &&
(coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.C;
coord.c() < problem_size_.C;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -204,7 +205,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
}
/// Increments to the next memory access

View File

@ -527,6 +527,64 @@ struct Conv2dDgradOutputGradientIteratorOptimizedParams {
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
// Strided Dgrad Optimized Dy params (layout::TensorNHWC)
/////////////////////////////////////////////////////////////////////////////////////////////////
struct Conv2dStridedDgradOutputGradientIteratorOptimizedParams {
using Layout = layout::TensorNHWC;
Layout layout;
int64_t inc_next[3]; // {next S, next R, next K}
int filter_k_delta; // number of logical elements to add to filter_k_
int tiled_rows_per_filter;
int conv_sign;
//
// Methods
//
CUTLASS_HOST_DEVICE
Conv2dStridedDgradOutputGradientIteratorOptimizedParams() { }
CUTLASS_HOST_DEVICE
Conv2dStridedDgradOutputGradientIteratorOptimizedParams(
Conv2dProblemSize const &problem_size,
Layout const &layout, ///< layout object
int element_size_bits, ///< size of each element in bits
MatrixCoord threadblock_shape
): layout(layout) {
int tile_m_per_filter = strided_dgrad_tile_m_per_filter(problem_size, threadblock_shape.row());
tiled_rows_per_filter = tile_m_per_filter * threadblock_shape.row();
conv_sign = (problem_size.mode == Mode::kConvolution ? 1 : -1);
// next S
inc_next[0] = conv_sign * (
layout.stride()[0] * problem_size.dilation_w
) * element_size_bits / 8;
// next R
inc_next[1] = conv_sign * (
layout.stride()[1] * problem_size.dilation_h
) * element_size_bits / 8;
// next K
inc_next[2] = (
threadblock_shape.column() * problem_size.split_k_slices
) * element_size_bits / 8;
// logical offset added to internal channel counter - units are elements, not bytes
filter_k_delta = threadblock_shape.column() * problem_size.split_k_slices;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
////////////////////////////////////////////////////////////////////////////////////////////////
// Dgrad Optimized w params (layout::TensorNHWC)
/////////////////////////////////////////////////////////////////////////////////////////////////
@ -584,6 +642,73 @@ struct Conv2dDgradFilterIteratorOptimizedParams {
/////////////////////////////////////////////////////////////////////////////////////////////////
////////////////////////////////////////////////////////////////////////////////////////////////
// StridedDgrad Optimized w params (layout::TensorNHWC)
/////////////////////////////////////////////////////////////////////////////////////////////////
struct Conv2dStridedDgradFilterIteratorOptimizedParams {
using Layout = layout::TensorNHWC;
Layout layout;
int RS;
int filter_k_delta;
int64_t inc_next_strided; // offset in units of bytes to next K coordinate within tile
int64_t inc_next[3]; // {next S, next R, next K}
int64_t reset_bytes; // offset in units of bytes to move back the pointer
//
// Methods
//
CUTLASS_HOST_DEVICE
Conv2dStridedDgradFilterIteratorOptimizedParams() { }
CUTLASS_HOST_DEVICE
Conv2dStridedDgradFilterIteratorOptimizedParams(
Conv2dProblemSize const &problem_size,
Layout const &layout,
int element_size_bits, ///< size of each element in bits
MatrixCoord threadblock_shape,
int thread_count,
int access_size,
layout::PitchLinearCoord threadmap_iterations,
layout::PitchLinearCoord threadmap_delta
):
layout(layout), RS(problem_size.R * problem_size.S) {
TRACE_CONV_INITIALIZERS("conv2d_dgrad", "filter",
element_size_bits, threadblock_shape, thread_count, access_size, threadmap_iterations, threadmap_delta);
inc_next_strided = (layout.stride()[2] * threadmap_delta.strided() * element_size_bits) / 8;
// next S
inc_next[0] =
( layout.stride()[0] * problem_size.stride_w
//- (threadmap_iterations.strided() - 1) * threadmap_delta.strided() * layout.stride()[2]
) * element_size_bits / 8;
// next R
inc_next[1] =
( layout.stride()[1] * problem_size.stride_h
//- (threadmap_iterations.strided() - 1) * threadmap_delta.strided() * layout.stride()[2]
) * element_size_bits / 8;
// next K
inc_next[2] =
(
threadblock_shape.row() * problem_size.split_k_slices * layout.stride()[2]
//- (problem_size.R * problem_size.S - 1) * layout.stride()[0]
//- (threadmap_iterations.strided() - 1) * threadmap_delta.strided() * layout.stride()[2]
) * element_size_bits / 8;
// offset in units of bytes to move the pointer in backward direction
reset_bytes = (threadmap_iterations.strided() - 1) * threadmap_delta.strided() * layout.stride()[2]
* element_size_bits / 8;
filter_k_delta = threadblock_shape.row() * problem_size.split_k_slices;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
/// Parameters object for Conv2d WGRAD Output Gradient (dy) iterator
struct Conv2dWgradOutputGradientIteratorOptimizedParams {

View File

@ -183,10 +183,13 @@ public:
int r, s, c;
if (kAccessesPerVector == 1) {
/// One 128b aligned access fetching more than one element
c = filter_c_[iteration_contiguous_];
r = filter_r_[iteration_contiguous_];
s = filter_s_[iteration_contiguous_];
c = filter_c_[iteration_contiguous_];
} else {
}
else {
/// Multiple access to support non-128b alignment in contiguous dimenstion
c = (filter_c_[iteration_contiguous_] + iteration_vector_ * AccessType::kElements) % problem_size_.C;
int wrap_c = (filter_c_[iteration_contiguous_] + iteration_vector_ * AccessType::kElements) / problem_size_.C;
s = (filter_s_[iteration_contiguous_] + wrap_c) % problem_size_.S;

View File

@ -205,6 +205,8 @@ public:
int c = filter_c_[iteration_contiguous_];
if (kAccessesPerVector > 1) {
// This code section is only to support non-128b alignment
// Multiple access to support non-128b alignment in contiguous dimenstion
int wrap_c;
params_.c_divmod(wrap_c, c, c + iteration_vector_ * AccessType::kElements);

View File

@ -182,7 +182,9 @@ public:
int p = residual / problem_size_.Q;
int q = residual % problem_size_.Q;
return TensorCoord(n, p, q, filter_k_[iteration_contiguous_]);
int k = filter_k_[iteration_contiguous_] + iteration_vector_ * AccessType::kElements;
return TensorCoord(n, p, q, k);
}
@ -194,7 +196,7 @@ public:
return coord.n() < problem_size_.N &&
coord.h() < problem_size_.P &&
coord.w() < problem_size_.Q &&
(coord.c() + iteration_vector_ * AccessType::kElements) < problem_size_.K;
coord.c() < problem_size_.K;
}
/// Returns a pointer to the vector starting at the current coordinate
@ -204,7 +206,7 @@ public:
TensorCoord coord = at();
LongIndex offset = params_.layout(coord);
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8) + iteration_vector_;
return reinterpret_cast<AccessType const *>(pointer_ + offset * sizeof_bits<Element>::value / 8);
}
/// Increments to the next memory access

View File

@ -192,6 +192,32 @@ struct GELU_taylor {
}
};
template <int N>
struct GELU_taylor<Array<half_t, N> > {
static const bool kIsHeavy=true;
CUTLASS_HOST_DEVICE
Array<half_t, N> operator()(Array<half_t, N> const &z) const {
using T = half_t;
Array<half_t, N> y;
half_t k0 = half_t(0.7978845608028654);
half_t k1 = half_t(0.044715);
multiply_add<Array<half_t, N>> fma;
multiplies<Array<half_t, N>> mul;
plus<Array<half_t, N>> add;
fast_tanh_op<Array<half_t, N>> tanh;
Array<half_t, N> u = mul(mul(k0, z), fma(mul(k1, z), z, cutlass::constants::one<T>()));
y = mul(mul(z, cutlass::constants::half<T>()), add(cutlass::constants::one<T>(), tanh(u)));
return y;
}
};
template <typename T, int N>
struct GELU_taylor<Array<T, N> > {
static const bool kIsHeavy=true;

View File

@ -234,8 +234,9 @@ public:
if (WarpShape::kN == 64) {
ptr = pointers_[n / 4];
}
#else
else
#endif
{
// This is the reference implementation
int column_idx = warp_column_ + n * Detail::kLanesInQuad * Policy::kElementsPerAccess;
int ptr_idx = ((column_idx * sizeof_bits<Element>::value) / 1024) % Detail::kPointerCount;
@ -252,7 +253,8 @@ public:
else if (ptr_idx == 3) {
ptr = pointers_[3 % Detail::kPointerCount];
}
#endif
}
int offset = n * Detail::kLanesInQuad + pointer_offset / Policy::kElementsPerAccess;

View File

@ -34,6 +34,7 @@
#endif
#include "cutlass/cutlass.h"
#include "cutlass/array.h"
#include "cutlass/uint128.h"
#include "cutlass/coord.h"
#include "cutlass/numeric_types.h"
@ -724,7 +725,13 @@ double fast_log(double x) {
CUTLASS_HOST_DEVICE
float fast_tanh(float x) {
#if defined(__CUDA_ARCH__)
return ::tanhf(x);
#if (__CUDACC_VER_MAJOR__ >= 11) && (__CUDA_ARCH__ >= 750)
float y;
asm volatile ( "tanh.approx.f32 %0, %1; " : "=f"(y) : "f"(x));
return y;
#else
return ::tanhf(x);
#endif
#else
return std::tanh(x);
#endif
@ -739,6 +746,74 @@ double fast_tanh(double x) {
#endif
}
CUTLASS_HOST_DEVICE
half_t fast_tanh(half_t x) {
#if defined(__CUDA_ARCH__) && (__CUDACC_VER_MAJOR__ >= 11) && (__CUDA_ARCH__ >= 750)
asm volatile ( "tanh.approx.f16 %0, %1;" : "=h"(x.raw()) : "h"(x.raw()));
return x;
#else
return half_t(fast_tanh(float(x)));
#endif
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename T>
struct fast_tanh_op {
CUTLASS_HOST_DEVICE
T operator()(T const &rhs) const {
return fast_tanh(rhs);
}
};
#if defined(__CUDA_ARCH__) && (__CUDACC_VER_MAJOR__ >= 11) && (__CUDA_ARCH__ >= 750)
template <int N>
struct fast_tanh_op<Array<half_t, N>> {
CUTLASS_DEVICE
Array<half_t, N> operator()(Array<half_t, N> const &rhs) const {
Array<half_t, N> result;
// use x2 specialization
uint32_t const *in = reinterpret_cast<uint32_t const *>(&rhs);
uint32_t *out = reinterpret_cast<uint32_t *>(&result);
CUTLASS_PRAGMA_UNROLL
for (int i = 0; i < N / 2; ++i) {
asm volatile ("tanh.approx.f16x2 %0, %1;" : "=r"(out[i]) : "r"(in[i]));
}
// residual
if (N % 2) {
uint16_t const *in = reinterpret_cast<uint16_t const *>(&rhs);
uint16_t *out = reinterpret_cast<uint16_t *>(&result);
asm volatile ("tanh.approx.f16 %0, %1;" : "=h"(out[N - 1]) : "h"(in[N - 1]));
}
return result;
}
};
#endif // #if defined(__CUDA_ARCH__)
template <typename T, int N>
struct fast_tanh_op<Array<T, N>> {
CUTLASS_HOST_DEVICE
Array<T, N> operator()(Array<T, N> const &rhs) const {
fast_tanh_op<T> fast_op;
Array<T, N> y;
CUTLASS_PRAGMA_UNROLL
for (int i = 0; i < N; ++i) {
y[i] = fast_op(rhs[i]);
}
return y;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
} // namespace cutlass

View File

@ -126,7 +126,7 @@ struct DefaultGemmWithKReduction {
ThreadblockShape, typename Mma::Operator, kPartitionsK, EpilogueOutputOp,
EpilogueOutputOp::kCount>::Epilogue;
/// Define the epilogue
/// Define the epilogue of the reduction vector
using EpilogueGemmKReduction =
typename cutlass::epilogue::threadblock::EpilogueGemmKReduction<
ElementAccumulator, ElementC, ThreadblockShape, typename Mma::Operator, kReduceKForA>;

View File

@ -582,6 +582,13 @@ public:
__threadfence();
}
// Execute the epilogue operator to update the destination tensor.
epilogue(
output_op,
iterator_D,
accumulators,
iterator_C);
if ((kReduceKForA && threadblock_tile_offset.n() == 0)
|| (!kReduceKForA && threadblock_tile_offset.m() == 0)) {
@ -610,14 +617,7 @@ public:
&& (threadblock_tile_offset.k() > 0));
}
}
// Execute the epilogue operator to update the destination tensor.
epilogue(
output_op,
iterator_D,
accumulators,
iterator_C);
//
// Release the semaphore
//

View File

@ -378,11 +378,21 @@ struct DefaultMma<ElementA, LayoutA, kAlignmentA, ElementB, LayoutB,
|| platform::is_same<LayoutC, layout::AffineRankN<2>>::value,
"simt epilogue must be row major");
static cutlass::arch::CacheOperation::Kind const CacheOpA =
((sizeof_bits<ElementA>::value * kAlignmentA) == 128)
? cutlass::arch::CacheOperation::Global
: cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const CacheOpB =
((sizeof_bits<ElementB>::value * kAlignmentB) == 128)
? cutlass::arch::CacheOperation::Global
: cutlass::arch::CacheOperation::Always;
// Define the MmaCore components
using MmaCore = typename cutlass::gemm::threadblock::DefaultMmaCore<
ThreadblockShape, WarpShape, InstructionShape, ElementA, LayoutA,
ElementB, LayoutB, ElementAccumulator, LayoutC, arch::OpClassSimt,
Stages, Operator>;
Stages, Operator, false, CacheOpA, CacheOpB>;
// Define iterators over tiles from the A operand
using ThreadMapA = typename MmaCore::IteratorThreadMapA;

View File

@ -1111,8 +1111,8 @@ struct DefaultMmaCore<
using ElementC = complex<double>;
using LayoutC = LayoutC_;
static int const kStages = Stages;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Global;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Global;
static const ComplexTransform TransformA = TransformA_;
static const ComplexTransform TransformB = TransformB_;

View File

@ -116,11 +116,22 @@ struct DefaultMultistageMmaComplex<ElementA, LayoutA, ElementB, LayoutB,
ElementAccumulator, layout::RowMajor, OperatorClass,
ArchTag, ThreadblockShape, WarpShape,
InstructionShape, Stages, TransformA, TransformB, Operator> {
static cutlass::arch::CacheOperation::Kind const CacheOpA =
(sizeof_bits<ElementA>::value == 128)
? cutlass::arch::CacheOperation::Global
: cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const CacheOpB =
(sizeof_bits<ElementB>::value == 128)
? cutlass::arch::CacheOperation::Global
: cutlass::arch::CacheOperation::Always;
// Define the MmaCore components
using MmaCore = typename cutlass::gemm::threadblock::DefaultMultistageMmaComplexCore<
ThreadblockShape, WarpShape, InstructionShape, ElementA, LayoutA,
ElementB, LayoutB, ElementAccumulator, layout::RowMajor, OperatorClass,
Stages, TransformA, TransformB, Operator>;
Stages, TransformA, TransformB, Operator, CacheOpA, CacheOpB>;
// Define iterators over tiles from the A operand
using ThreadMapA = typename MmaCore::IteratorThreadMapA;

View File

@ -113,8 +113,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Global;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Global;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -242,8 +242,8 @@ struct DefaultMultistageMmaComplexCore<
using Operator = Operator_;
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Global;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Global;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -371,8 +371,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Global;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Global;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -501,8 +501,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Global;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Global;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -1159,8 +1159,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = CacheOpA;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = CacheOpB;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -1326,8 +1326,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = CacheOpA;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = CacheOpB;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -1490,8 +1490,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = CacheOpA;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = CacheOpB;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -1660,8 +1660,8 @@ struct DefaultMultistageMmaComplexCore<
static ComplexTransform const kTransformA = TransformA;
static ComplexTransform const kTransformB = TransformB;
using Operator = Operator_;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = cutlass::arch::CacheOperation::Always;
static cutlass::arch::CacheOperation::Kind const kCacheOpA = CacheOpA;
static cutlass::arch::CacheOperation::Kind const kCacheOpB = CacheOpB;
/// Number of warps present
using WarpCount = GemmShape<Shape::kM / WarpShape::kM,
@ -1775,7 +1775,6 @@ struct DefaultMultistageMmaComplexCore<
////////////////////////////////////////////////////////////////////////////////
} // namespace threadblock
} // namespace gemm
} // namespace cutlass

View File

@ -298,7 +298,6 @@ class PredicatedTileAccessIteratorPredicates {
return pred;
}
};
////////////////////////////////////////////////////////////////////////////////

View File

@ -49,6 +49,8 @@ target_link_libraries(
cutlass_test_unit_infra
)
set(CUTLASS_TEST_UNIT_RESULTS_CACHE_DIR ${CMAKE_CURRENT_LIST_DIR}/data/hashes)
function(cutlass_test_unit_add_executable NAME)
set(options)
@ -58,6 +60,8 @@ function(cutlass_test_unit_add_executable NAME)
cutlass_add_executable(${NAME} ${__UNPARSED_ARGUMENTS})
target_compile_definitions(${NAME} PUBLIC CUTLASS_TARGET_NAME="${NAME}")
target_link_libraries(
${NAME}
PRIVATE
@ -67,11 +71,18 @@ function(cutlass_test_unit_add_executable NAME)
string(REGEX REPLACE cutlass_ "" NAME_STEM ${NAME})
set(RESULT_CACHE_FILE "${CUTLASS_TEST_UNIT_RESULTS_CACHE_DIR}/cached_results_${NAME}.txt")
if (EXISTS ${RESULT_CACHE_FILE})
set(RESULT_CACHE_FILE_ARGS RESULT_CACHE_FILE ${RESULT_CACHE_FILE})
endif()
set(CUTLASS_TEST_UNIT_TEST_COMMAND_OPTIONS --gtest_output=xml:${NAME_STEM}.gtest.xml)
cutlass_add_executable_tests(
${NAME_STEM} ${NAME}
${NAME_STEM} ${NAME}
TEST_COMMAND_OPTIONS CUTLASS_TEST_UNIT_TEST_COMMAND_OPTIONS
${RESULT_CACHE_FILE_ARGS}
)
endfunction()

View File

@ -134,7 +134,7 @@ cutlass_test_unit_add_executable(
conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm70.cu
)
# Conv2d - F16 input, F32 output, F32 accumulation - SM75
# Conv - F16 input, F32 output, F32 accumulation - SM75
cutlass_test_unit_add_executable(
cutlass_test_unit_conv_device_tensorop_f32_sm75
@ -144,11 +144,13 @@ cutlass_test_unit_add_executable(
conv2d_fprop_with_broadcast_sm75.cu
conv2d_fprop_with_reduction_sm75.cu
conv3d_wgrad_implicit_gemm_f16ndhwc_f16ndhwc_f32ndhwc_tensor_op_f32_sm75.cu
)
if (CUTLASS_NVCC_MAX_ARCH GREATER_EQUAL 80)
# Conv2d - F16 input, F16 output, F16 accumulation
# Conv - F16 input, F16 output, F16 accumulation
cutlass_test_unit_add_executable(
cutlass_test_unit_conv_device_tensorop_f16_sm80
@ -157,24 +159,23 @@ if (CUTLASS_NVCC_MAX_ARCH GREATER_EQUAL 80)
conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f16nhwc_tensor_op_f16_sm80.cu
)
# Conv2d - F16 input, F32 output, F32 accumulation
# Conv - F16 input, F32 output, F32 accumulation
cutlass_test_unit_add_executable(
cutlass_test_unit_conv_device_tensorop_f32_sm80
# Conv2d
conv2d_fprop_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.cu
conv2d_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.cu
conv2d_wgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.cu
conv3d_wgrad_implicit_gemm_f16ndhwc_f16ndhwc_f32ndhwc_tensor_op_f32_sm75.cu
conv3d_wgrad_implicit_gemm_f16ndhwc_f16ndhwc_f32ndhwc_tensor_op_f32_sm80.cu
# Strided Dgrad
# Conv2d (Strided Dgrad)
conv2d_strided_dgrad_implicit_gemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_sm80.cu
# Conv3d
conv3d_wgrad_implicit_gemm_f16ndhwc_f16ndhwc_f32ndhwc_tensor_op_f32_sm80.cu
)
# Conv2d - TF32 input, F32 output, F32 accumulation
# Conv - TF32 input, F32 output, F32 accumulation
cutlass_test_unit_add_executable(
cutlass_test_unit_conv_device_tensorop_f32_tf32_sm80
@ -192,7 +193,6 @@ endif()
if (CUTLASS_NVCC_MAX_ARCH GREATER_EQUAL 75)
# Conv2d - S8 input, S32 output, S32 accumulation
cutlass_test_unit_add_executable(
cutlass_test_unit_conv_device_tensorop_s32
conv2d_fprop_implicit_gemm_s8nhwc_s8nhwc_s32nhwc_tensor_op_s32_sm75.cu
@ -200,7 +200,6 @@ if (CUTLASS_NVCC_MAX_ARCH GREATER_EQUAL 75)
)
# Conv2d - S8 interleaved input, S8 interleaved output, S32 accumulation
cutlass_test_unit_add_executable(
cutlass_test_unit_conv_device_tensorop_s32_interleaved
conv2d_fprop_implicit_gemm_s8ncxhwx_s8cxrskx_s8ncxhwx_tensor_op_s32_sm75.cu

View File

@ -0,0 +1,791 @@
/***************************************************************************************************
* Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without modification, are permitted
* provided that the following conditions are met:
* * Redistributions of source code must retain the above copyright notice, this list of
* conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright notice, this list of
* conditions and the following disclaimer in the documentation and/or other materials
* provided with the distribution.
* * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used
* to endorse or promote products derived from this software without specific prior written
* permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
* FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
* OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
**************************************************************************************************/
/*! \file
\brief Helper to construct cached name for
*/
#pragma once
#include <typeinfo>
#include <fstream>
#include <list>
#include <utility>
#include <sstream>
#include "cutlass/cutlass.h"
#include "cutlass/layout/matrix.h"
#include "cutlass/conv/convolution.h"
#include "cutlass/conv/conv2d_problem_size.h"
#include "cutlass/conv/conv3d_problem_size.h"
#include "cutlass/core_io.h"
#include "cutlass/util/tensor_view_io.h"
#ifndef CUTLASS_TEST_ENABLE_CACHED_RESULTS
#define CUTLASS_TEST_ENABLE_CACHED_RESULTS false
#endif
/////////////////////////////////////////////////////////////////////////////////////////////////
namespace test {
namespace conv {
namespace device {
/////////////////////////////////////////////////////////////////////////////////////////////////
/// Result of a test
struct CachedTestKey {
std::string op; ///< Concatenated string representation of operation performed
std::string problem; ///< Concatenated string representation of problem description
std::string types; ///< Concatenated string representation of operand types
uint32_t A; ///< Hashed result of tensor A
uint32_t B; ///< Hashed result of tensor B
uint32_t C; ///< Hashed result of tensor C
//
// Methods
//
inline CachedTestKey(): A(), B(), C() { }
inline CachedTestKey(
std::string op, ///< Concatenated string representation of operation performed
std::string problem, ///< Concatenated string representation of problem description
std::string types, ///< Concatenated string representation of operand types
uint32_t A, ///< Hashed result of tensor A
uint32_t B, ///< Hashed result of tensor B
uint32_t C ///< Hashed result of tensor C
):
op(op), problem(problem), types(types), A(A), B(B), C(C)
{ }
/// Checks for equality of the problem
bool operator==(CachedTestKey const &rhs) const {
return op == rhs.op && problem == rhs.problem && types == rhs.types && A == rhs.A && B == rhs.B && C == rhs.C;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
inline std::istream &operator>>(std::istream &in, CachedTestKey &result) {
in >> result.op;
in >> result.problem;
in >> result.types;
in >> result.A;
in >> result.B;
in >> result.C;
return in;
}
inline std::ostream &operator<<(std::ostream &out, CachedTestKey const &result) {
out << result.op << " ";
out << result.problem << " ";
out << result.types << " ";
out << result.A << " ";
out << result.B << " ";
out << result.C << " ";
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
struct CachedTestResult {
uint32_t D;
//
// Methods
//
CachedTestResult(): D() { }
CachedTestResult(uint32_t D): D(D) { }
operator bool() const {
return bool(D);
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
inline std::istream &operator>>(std::istream &in, CachedTestResult &result) {
in >> result.D;
return in;
}
inline std::ostream &operator<<(std::ostream &out, CachedTestResult const &result) {
out << result.D;
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
struct CachedTestResultListing {
std::list<std::pair<CachedTestKey, CachedTestResult>> results;
//
// Methods
//
inline CachedTestResultListing(std::string const &path) {
std::ifstream file(path);
while (file.good()) {
CachedTestKey key;
file >> key;
CachedTestResult result;
file >> result;
if (result) {
results.push_back(std::make_pair(key, result));
}
}
}
/// Returns the cached result
std::pair<bool, CachedTestResult> find(CachedTestKey const &rhs) const {
for (auto const & result : results) {
if (result.first == rhs) {
return std::make_pair(true, result.second);
}
}
return std::make_pair(false, CachedTestResult());
}
/// Appends an entry
void append(CachedTestKey const &key, CachedTestResult const &result) {
if (result) {
results.push_back(std::make_pair(key, result));
}
}
/// Writes the entire listing to a file
bool write(std::string const &path) {
std::ofstream file(path);
if (!file.good()) {
return false;
}
for (auto const &result : results) {
file << result.first << result.second << std::endl;
}
return true;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename Element>
struct ScalarEncoder {
Element scalar;
ScalarEncoder(Element s): scalar(s) { }
std::string str() const {
std::stringstream ss;
Element s = scalar;
if (s < Element()) {
s = -s;
ss << "n";
}
ss << s;
return ss.str();
}
};
template <typename Element>
ScalarEncoder<Element> EncodeScalar(Element a) {
return ScalarEncoder<Element>(a);
}
template <typename Element>
struct ScalarEncoder<cutlass::complex<Element>> {
cutlass::complex<Element> scalar;
ScalarEncoder(cutlass::complex<Element> s): scalar(s) { }
std::string str() const {
std::stringstream ss;
ss << EncodeScalar<Element>(scalar.real()) << "_" << EncodeScalar<Element>(scalar.imag()) << "i";
return ss.str();
}
};
template <typename Element>
std::ostream &operator<<(std::ostream &out, ScalarEncoder<Element> const &scalar) {
out << scalar.str();
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
inline char const *EncodeOperator(cutlass::conv::Operator conv_op) {
switch (conv_op) {
case cutlass::conv::Operator::kFprop: return "fprop";
case cutlass::conv::Operator::kDgrad: return "dgrad";
case cutlass::conv::Operator::kWgrad: return "wgrad";
}
return "conv_unknown";
}
/////////////////////////////////////////////////////////////////////////////////////////////////
// Encode GemmCoord (Gemm problem size)
inline std::ostream &EncodeProblemSize(
std::ostream &out,
cutlass::gemm::GemmCoord const &problem) {
out << problem.m() << "x" << problem.n() << "x" << problem.k() << "_";
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
// Encode Conv2dProblemSize
inline std::ostream &EncodeProblemSize(
std::ostream &out,
cutlass::conv::Conv2dProblemSize const &problem) {
out << problem.N << "x" << problem.H << "x" << problem.W << "x" << problem.C << "_"
<< problem.P << "x" << problem.Q << "_" << problem.K << "x" << problem.R << "x" << problem.S << "_";
out << "pad_h" << problem.pad_h << "w" << problem.pad_w << "_";
out << "stride_h" << problem.stride_h << "w" << problem.stride_w << "_";
out << "dil_h" << problem.dilation_h << "w" << problem.dilation_w << "_";
switch (problem.mode) {
case cutlass::conv::Mode::kCrossCorrelation:
out << "corr";
break;
case cutlass::conv::Mode::kConvolution:
out << "conv";
break;
}
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
// Encode Conv3dProblemSize
inline std::ostream &EncodeProblemSize(
std::ostream &out,
cutlass::conv::Conv3dProblemSize const &problem) {
out << problem.N << "x" << problem.D << "x" << problem.H << "x" << problem.W << "x" << problem.C << "_"
<< problem.Z << problem.P << "x" << problem.Q << "_" << problem.K << "x" << problem.R << "x" << problem.S << "_";
out << "pad_d" << problem.pad_h << "h" << problem.pad_h << "w" << problem.pad_w << "_";
out << "stride_d" << problem.stride_d << "h" << problem.stride_h << "w" << problem.stride_w << "_";
out << "dil_d" << problem.dilation_d << "h" << problem.dilation_h << "w" << problem.dilation_w << "_";
switch (problem.mode) {
case cutlass::conv::Mode::kCrossCorrelation:
out << "corr";
break;
case cutlass::conv::Mode::kConvolution:
out << "conv";
break;
}
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename Element>
inline std::string ElementTypeName() {
return std::string(typeid(Element).name());
}
template <>
inline std::string ElementTypeName<cutlass::half_t>() {
return "h";
}
template <>
inline std::string ElementTypeName<cutlass::complex<cutlass::half_t>>() {
return "ch";
}
template <>
inline std::string ElementTypeName<cutlass::bfloat16_t>() {
return "bf16";
}
template <>
inline std::string ElementTypeName<cutlass::complex<cutlass::bfloat16_t>>() {
return "cbf16";
}
template <>
inline std::string ElementTypeName<cutlass::tfloat32_t>() {
return "tf32";
}
template <>
inline std::string ElementTypeName<cutlass::complex<cutlass::tfloat32_t>>() {
return "ctf32";
}
template <>
inline std::string ElementTypeName<cutlass::complex<float>>() {
return "c";
}
template <>
inline std::string ElementTypeName<cutlass::complex<double>>() {
return "z";
}
template <>
inline std::string ElementTypeName<cutlass::Quaternion<float>>() {
return "q";
}
template <>
inline std::string ElementTypeName<int8_t>() {
return "s8";
}
template <>
inline std::string ElementTypeName<uint8_t>() {
return "u8";
}
template <>
inline std::string ElementTypeName<cutlass::int4b_t>() {
return "s4";
}
template <>
inline std::string ElementTypeName<cutlass::uint4b_t>() {
return "u4";
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename Layout>
inline std::string LayoutTypeName() {
return std::string(typeid(Layout).name());
}
template <>
inline std::string LayoutTypeName<cutlass::layout::ColumnMajor>() {
return "n";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::RowMajor>() {
return "t";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::TensorNHWC>() {
return "nhwc";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::TensorNCxHWx<32>>() {
return "nc32hw32";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::TensorNCxHWx<64>>() {
return "nc64hw64";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::TensorCxRSKx<32>>() {
return "c32rsk32";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::TensorCxRSKx<64>>() {
return "c64rsk64";
}
template <>
inline std::string LayoutTypeName<cutlass::layout::TensorNDHWC>() {
return "ndhwc";
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename Element, typename Layout>
inline std::string TensorTypeName() {
std::stringstream ss;
ss << ElementTypeName<Element>() << LayoutTypeName<Layout>();
return ss.str();
}
/////////////////////////////////////////////////////////////////////////////////////////////////
/// Hash function on a byte array
struct CRC32 {
uint32_t table[256];
//
// Methods
//
CRC32() {
uint32_t rem;
int i, j;
for (i = 0; i < 256; i++) {
rem = i;
for (j = 0; j < 8; j++) {
if (rem & 1) {
rem >>= 1;
rem ^= 0xedb88320;
} else
rem >>= 1;
}
table[i] = rem;
}
}
/// Computes the CRC of an array of bytes
uint32_t operator()(void const *start, size_t length, uint32_t crc = uint32_t()) const {
uint8_t const *p = static_cast<uint8_t const *>(start);
uint8_t const *q = static_cast<uint8_t const *>(start) + length;
crc = ~crc;
for (; p != q; ++p) {
uint8_t octet = *p;
crc = (crc >> 8) ^ table[(crc & 0xff) ^ octet];
}
return ~crc;
}
};
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename Element, typename Layout
>
uint32_t TensorHash(
cutlass::TensorView<Element, Layout> view,
CRC32 const &hash = CRC32(),
uint32_t crc = uint32_t()
) {
return hash(view.data(), view.capacity() * cutlass::sizeof_bits<Element>::value / 8, crc);
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA, typename LayoutA,
typename ElementB, typename LayoutB,
typename ElementC, typename LayoutC,
typename ElementAccumulator,
typename ElementCompute
>
inline std::ostream &EncodeTypes(
std::ostream &out
) {
out << TensorTypeName<ElementA, LayoutA>() << "_"
<< TensorTypeName<ElementB, LayoutB>() << "_"
<< TensorTypeName<ElementC, LayoutC>() << "_"
<< ElementTypeName<ElementAccumulator>() << "_"
<< ElementTypeName<ElementCompute>();
return out;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA, typename LayoutA,
typename ElementB, typename LayoutB,
typename ElementC, typename LayoutC,
typename ElementAccumulator,
typename ElementCompute
>
inline CachedTestKey CreateCachedGemmTestKey(
cutlass::gemm::GemmCoord const &problem,
ElementCompute alpha,
ElementCompute beta,
cutlass::TensorView<ElementA, LayoutA> A,
cutlass::TensorView<ElementA, LayoutB> B,
cutlass::TensorView<ElementC, LayoutC> C
) {
CachedTestKey key;
// Encode gemm operator and problem sizes
key.op = "gemm";
std::stringstream ss_problem;
EncodeProblemSize(ss_problem, problem);
ss_problem << "_alpha" << EncodeScalar(alpha) << "_beta" << EncodeScalar(beta);
key.problem = ss_problem.str();
// Encode problem data types
std::stringstream ss_types;
EncodeTypes<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute>(ss_types);
key.types = ss_types.str();
// Encode hash for problem data
CRC32 crc_hash;
key.A = TensorHash(A, crc_hash);
key.B = TensorHash(B, crc_hash);
key.C = TensorHash(C, crc_hash);
return key;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA, typename LayoutA,
typename ElementB, typename LayoutB,
typename ElementC, typename LayoutC,
typename ElementAccumulator,
typename ElementCompute
>
inline CachedTestKey CreateCachedConv2dTestKey(
cutlass::conv::Operator conv_operator,
cutlass::conv::Conv2dProblemSize const &problem,
ElementCompute alpha,
ElementCompute beta,
cutlass::TensorView<ElementA, LayoutA> A,
cutlass::TensorView<ElementA, LayoutB> B,
cutlass::TensorView<ElementC, LayoutC> C
) {
CachedTestKey key;
// Encode conv2d operator and problem sizes
key.op = "conv2d";
std::stringstream ss_problem;
ss_problem << EncodeOperator(conv_operator) << "_";
EncodeProblemSize(ss_problem, problem);
ss_problem << "_alpha" << EncodeScalar(alpha) << "_beta" << EncodeScalar(beta);
key.problem = ss_problem.str();
// Encode problem data types
std::stringstream ss_types;
EncodeTypes<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute>(ss_types);
key.types = ss_types.str();
// Encode hash for problem data
CRC32 crc_hash;
key.A = TensorHash(A, crc_hash);
key.B = TensorHash(B, crc_hash);
key.C = TensorHash(C, crc_hash);
return key;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA, typename LayoutA,
typename ElementB, typename LayoutB,
typename ElementC, typename LayoutC,
typename ElementAccumulator,
typename ElementCompute
>
inline CachedTestKey CreateCachedConv2dWithBroadcastTestKey(
cutlass::conv::Operator conv_operator,
cutlass::conv::Conv2dProblemSize const &problem,
ElementCompute alpha,
ElementCompute beta,
cutlass::TensorView<ElementA, LayoutA> A,
cutlass::TensorView<ElementA, LayoutB> B,
cutlass::TensorView<ElementC, LayoutC> C
) {
CachedTestKey key;
// Encode conv2d operator and problem sizes
key.op = "conv2d_with_broadcast";
std::stringstream ss_problem;
ss_problem << EncodeOperator(conv_operator) << "_";
EncodeProblemSize(ss_problem, problem);
ss_problem << "_alpha" << EncodeScalar(alpha) << "_beta" << EncodeScalar(beta);
key.problem = ss_problem.str();
// Encode problem data types
std::stringstream ss_types;
EncodeTypes<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute>(ss_types);
key.types = ss_types.str();
// Encode hash for problem data
CRC32 crc_hash;
key.A = TensorHash(A, crc_hash);
key.B = TensorHash(B, crc_hash);
key.C = TensorHash(C, crc_hash);
return key;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA, typename LayoutA,
typename ElementB, typename LayoutB,
typename ElementC, typename LayoutC,
typename ElementAccumulator,
typename ElementCompute
>
inline CachedTestKey CreateCachedConv2dWithReductionTestKey(
cutlass::conv::Operator conv_operator,
cutlass::conv::Conv2dProblemSize const &problem,
ElementCompute alpha,
ElementCompute beta,
cutlass::TensorView<ElementA, LayoutA> A,
cutlass::TensorView<ElementA, LayoutB> B,
cutlass::TensorView<ElementC, LayoutC> C
) {
CachedTestKey key;
// Encode conv2d operator and problem sizes
key.op = "conv2d_with_reduction";
std::stringstream ss_problem;
ss_problem << EncodeOperator(conv_operator) << "_";
EncodeProblemSize(ss_problem, problem);
ss_problem << "_alpha" << EncodeScalar(alpha) << "_beta" << EncodeScalar(beta);
key.problem = ss_problem.str();
// Encode problem data types
std::stringstream ss_types;
EncodeTypes<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute>(ss_types);
key.types = ss_types.str();
// Encode hash for problem data
CRC32 crc_hash;
key.A = TensorHash(A, crc_hash);
key.B = TensorHash(B, crc_hash);
key.C = TensorHash(C, crc_hash);
return key;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
template <
typename ElementA, typename LayoutA,
typename ElementB, typename LayoutB,
typename ElementC, typename LayoutC,
typename ElementAccumulator,
typename ElementCompute
>
inline CachedTestKey CreateCachedConv3dTestKey(
cutlass::conv::Operator conv_operator,
cutlass::conv::Conv3dProblemSize const &problem,
ElementCompute alpha,
ElementCompute beta,
cutlass::TensorView<ElementA, LayoutA> A,
cutlass::TensorView<ElementA, LayoutB> B,
cutlass::TensorView<ElementC, LayoutC> C
) {
CachedTestKey key;
// Encode conv3d operator and problem sizes
key.op = "conv3d";
std::stringstream ss_problem;
ss_problem << EncodeOperator(conv_operator) << "_";
EncodeProblemSize(ss_problem, problem);
ss_problem << "_alpha" << EncodeScalar(alpha) << "_beta" << EncodeScalar(beta);
key.problem = ss_problem.str();
// Encode problem data types
std::stringstream ss_types;
EncodeTypes<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute>(ss_types);
key.types = ss_types.str();
// Encode problem data
CRC32 crc_hash;
key.A = TensorHash(A, crc_hash);
key.B = TensorHash(B, crc_hash);
key.C = TensorHash(C, crc_hash);
return key;
}
/////////////////////////////////////////////////////////////////////////////////////////////////
} // namespace device
} // nammespace conv
} // namespace test
/////////////////////////////////////////////////////////////////////////////////////////////////

View File

@ -170,6 +170,25 @@ TEST(SM80_Device_Conv2d_Fprop_Analytic_ImplicitGemm_f16nhwc_f16nhwc_f16nhwc_tens
{1, 1} // dilation (dilation_h, dilation_w)
));
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 4, 4, 14}, // input size (NHWC)
{8, 3, 3, 14}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 23, 56, 98}, // input size (NHWC)
{128, 3, 3, 98}, // filter size (KRSC)
{4, 0, 5, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
/// Run all unit test sizes with device-level Conv2d instance
EXPECT_TRUE(test::conv::device::TestAllConv2d<Conv2dFprop>(problem_size_list));
}
@ -225,6 +244,25 @@ TEST(SM80_Device_Conv2d_Fprop_Optimized_ImplicitGemm_f16nhwc_f16nhwc_f16nhwc_ten
{1, 1} // dilation (dilation_h, dilation_w)
));
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 4, 4, 14}, // input size (NHWC)
{8, 3, 3, 14}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 23, 56, 98}, // input size (NHWC)
{128, 3, 3, 98}, // filter size (KRSC)
{4, 0, 5, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
/// Run all unit test sizes with device-level Conv2d instance
EXPECT_TRUE(test::conv::device::TestAllConv2d<Conv2dFprop>(problem_size_list));
}
@ -280,6 +318,24 @@ TEST(SM80_Device_Conv2d_Fprop_Optimized_ImplicitGemm_f16nhwc_f16nhwc_f16nhwc_ten
{1, 1} // dilation (dilation_h, dilation_w)
));
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 4, 4, 28}, // input size (NHWC)
{8, 3, 3, 28}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 23, 56, 100}, // input size (NHWC)
{128, 3, 3, 100}, // filter size (KRSC)
{4, 0, 5, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
/// Run all unit test sizes with device-level Conv2d instance
EXPECT_TRUE(test::conv::device::TestAllConv2d<Conv2dFprop>(problem_size_list));
}

View File

@ -182,7 +182,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{1, 7, 8, minimum_channel_size}, // input size (NHWC)
{8, 3, 3, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -190,7 +190,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{1, 7, 9, minimum_channel_size}, // input size (NHWC)
{8, 4, 4, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -198,7 +198,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{2, 7, 9, minimum_channel_size}, // input size (NHWC)
{8, 5, 5, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -206,7 +206,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{3, 7, 9, minimum_channel_size}, // input size (NHWC)
{8, 6, 5, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -214,7 +214,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{3, 7, 9, minimum_channel_size}, // input size (NHWC)
{8, 6, 6, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -222,7 +222,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{3, 7, 9, minimum_channel_size}, // input size (NHWC)
{8, 7, 7, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -234,7 +234,7 @@ struct TestbedConv2dProblemSizes {
// C < CTA::K and non-multiples of CTA::K. Typical CTA::K = {32, 64}
////////////////////////////////////////////////////////////////////////////////////////////
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 11, 11, minimum_channel_size}, // input size (NHWC)
{1, 11, 7, minimum_channel_size}, // input size (NHWC)
{8, 1, 1, minimum_channel_size}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
@ -242,7 +242,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 11, 11, minimum_channel_size}, // input size (NHWC)
{1, 11, 7, minimum_channel_size}, // input size (NHWC)
{8, 3, 3, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
@ -250,7 +250,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 13, 13, minimum_channel_size}, // input size (NHWC)
{1, 13, 11, minimum_channel_size}, // input size (NHWC)
{8, 1, 1, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
@ -258,40 +258,40 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, minimum_channel_size}, // input size (NHWC)
{8, 2, 2, minimum_channel_size}, // filter size (KRSC)
{1, 17, 19, minimum_channel_size}, // input size (NHWC)
{16, 2, 2, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 5, 5, minimum_channel_size}, // input size (NHWC)
{8, 3, 3, minimum_channel_size}, // filter size (KRSC)
{1, 23, 5, minimum_channel_size}, // input size (NHWC)
{16, 3, 3, minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, 8}, // input size (NHWC)
{8, 3, 3, 8}, // filter size (KRSC)
{1, 13, 17, 8}, // input size (NHWC)
{24, 3, 3, 8}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 8, 8, 8}, // input size (NHWC)
{8, 3, 3, 8}, // filter size (KRSC)
{1, 23, 21, 8}, // input size (NHWC)
{24, 3, 3, 8}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 16, 16, 8}, // input size (NHWC)
{8, 3, 3, 8}, // filter size (KRSC)
{1, 20, 24, 8}, // input size (NHWC)
{40, 3, 3, 8}, // filter size (KRSC)
{3, 3, 3, 3}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
@ -352,7 +352,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 16, 16, 64 + minimum_channel_size}, // input size (NHWC)
{1, 16, 24, 64 + minimum_channel_size}, // input size (NHWC)
{96, 3, 3, 64 + minimum_channel_size}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
@ -363,7 +363,7 @@ struct TestbedConv2dProblemSizes {
// Medium input size, filter size (1x1, 3,x3, 5x5, 7x7), stride (2, 2)
////////////////////////////////////////////////////////////////////////////////////
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 16, 16, 288}, // input size (NHWC)
{1, 13, 16, 288}, // input size (NHWC)
{160, 5, 5, 288}, // filter size (KRSC)
{2, 2, 2, 2}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
@ -371,7 +371,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 55, 55, 256}, // input size (NHWC)
{1, 55, 51, 256}, // input size (NHWC)
{512, 1, 1, 256}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
@ -379,7 +379,7 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 80, 80, 32}, // input size (NHWC)
{1, 71, 80, 32}, // input size (NHWC)
{64, 5, 5, 32}, // filter size (KRSC)
{2, 2, 2, 2}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
@ -398,7 +398,7 @@ struct TestbedConv2dProblemSizes {
// Medium input size stride (3, 3), filter (3, 3), non-default padding
////////////////////////////////////////////////////////////////////////////////////
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{1, 27, 27, 256}, // input size (NHWC)
{1, 27, 23, 256}, // input size (NHWC)
{512, 3, 3, 256}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{3, 3}, // stride (stride_h, stride_w)
@ -464,16 +464,16 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{32, 32, 32, 32}, // input size (NHWC)
{32, 1, 1, 32}, // filter size (KRSC)
{32, 24, 32, 32}, // input size (NHWC)
{32, 1, 2, 32}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{4, 3, 3, 128}, // input size (NHWC)
{256, 3, 3, 128}, // filter size (KRSC)
{4, 4, 5, 128}, // input size (NHWC)
{256, 3, 6, 128}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
{1, 1}, // dilation (dilation_h, dilation_w)
@ -481,8 +481,8 @@ struct TestbedConv2dProblemSizes {
));
conv2d_default_sizes.push_back(cutlass::conv::Conv2dProblemSize(
{4, 1, 1, 256}, // input size (NHWC)
{328, 3, 3, 256}, // filter size (KRSC)
{4, 2, 3, 256}, // input size (NHWC)
{328, 3, 5, 256}, // filter size (KRSC)
{1, 1, 1, 1}, // padding (pad_h, _, pad_w, _)
{1, 1}, // stride (stride_h, stride_w)
{1, 1}, // dilation (dilation_h, dilation_w)

View File

@ -231,4 +231,137 @@ TEST(SM80_Device_Conv2d_Strided_Dgrad_Analytic_ImplicitGemm_f16nhwc_f16nhwc_f32n
}
////////////////////////////////////////////////////////////////////////////////
////////////////////////////////////////////////////////////////////////////////
// Strided Dgrad (Optimized)
////////////////////////////////////////////////////////////////////////////////
TEST(SM80_Device_Conv2d_Strided_Dgrad_Optimized_ImplicitGemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32,
128x128_32x3_64x64x32) {
/// Conv operation element types for the Gemm equivalent (ImplicitGemm)
using ElementA = cutlass::half_t;
using ElementB = cutlass::half_t;
using ElementC = float;
using ElementAccumulator = float;
using ElementCompute = float;
/// Device-level Conv2d instance
using Conv2dDgradKernel = typename cutlass::conv::kernel::DefaultConv2dDgrad<
ElementA, cutlass::layout::TensorNHWC,
ElementB, cutlass::layout::TensorNHWC,
ElementC, cutlass::layout::TensorNHWC,
ElementAccumulator,
cutlass::arch::OpClassTensorOp,
cutlass::arch::Sm80,
cutlass::gemm::GemmShape<128, 128, 32>,
cutlass::gemm::GemmShape<64, 64, 32>,
cutlass::gemm::GemmShape<16, 8, 16>,
cutlass::epilogue::thread::LinearCombination<
ElementC,
128 / cutlass::sizeof_bits<ElementC>::value,
ElementAccumulator,
ElementCompute
>,
cutlass::conv::threadblock::StridedDgradIdentityThreadblockSwizzle<>,
3,
cutlass::arch::OpMultiplyAdd,
cutlass::conv::IteratorAlgorithm::kOptimized,
cutlass::conv::StrideSupport::kStrided
>::Kernel;
using Conv2dDgrad = cutlass::conv::device::ImplicitGemmConvolution<Conv2dDgradKernel>;
test::conv::device::Conv2dProblemVector problem_size_list;
#if 0 // run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 56, 56, 8}, // input size (NHWC)
{8, 1, 1, 8}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 55, 55, 8}, // input size (NHWC)
{8, 1, 1, 8}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
#endif
/// Run all unit test sizes with device-level Conv2d instance
EXPECT_TRUE(test::conv::device::TestAllConv2d<Conv2dDgrad>(problem_size_list));
}
////////////////////////////////////////////////////////////////////////////////
TEST(SM80_Device_Conv2d_Strided_Dgrad_Optimized_ImplicitGemm_f16nhwc_f16nhwc_f32nhwc_tensor_op_f32_align4,
128x128_32x3_64x64x32) {
/// Conv operation element types for the Gemm equivalent (ImplicitGemm)
using ElementA = cutlass::half_t;
using ElementB = cutlass::half_t;
using ElementC = float;
using ElementAccumulator = float;
using ElementCompute = float;
/// Device-level Conv2d instance
using Conv2dDgradKernel = typename cutlass::conv::kernel::DefaultConv2dDgrad<
ElementA, cutlass::layout::TensorNHWC,
ElementB, cutlass::layout::TensorNHWC,
ElementC, cutlass::layout::TensorNHWC,
ElementAccumulator,
cutlass::arch::OpClassTensorOp,
cutlass::arch::Sm80,
cutlass::gemm::GemmShape<128, 128, 32>,
cutlass::gemm::GemmShape<64, 64, 32>,
cutlass::gemm::GemmShape<16, 8, 16>,
cutlass::epilogue::thread::LinearCombination<
ElementC,
4,
ElementAccumulator,
ElementCompute
>,
cutlass::conv::threadblock::StridedDgradIdentityThreadblockSwizzle<>,
3,
cutlass::arch::OpMultiplyAdd,
cutlass::conv::IteratorAlgorithm::kOptimized,
cutlass::conv::StrideSupport::kStrided,
4,
4
>::Kernel;
using Conv2dDgrad = cutlass::conv::device::ImplicitGemmConvolution<Conv2dDgradKernel>;
test::conv::device::Conv2dProblemVector problem_size_list;
// run specific problem size in the unit test first
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 56, 56, 12}, // input size (NHWC)
{8, 1, 1, 12}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
problem_size_list.push_back(cutlass::conv::Conv2dProblemSize(
{1, 55, 55, 12}, // input size (NHWC)
{8, 1, 1, 12}, // filter size (KRSC)
{0, 0, 0, 0}, // padding (pad_h, _, pad_w, _)
{2, 2}, // stride (stride_h, stride_w)
{1, 1} // dilation (dilation_h, dilation_w)
));
/// Run all unit test sizes with device-level Conv2d instance
EXPECT_TRUE(test::conv::device::TestAllConv2d<Conv2dDgrad>(problem_size_list));
}
////////////////////////////////////////////////////////////////////////////////
#endif // CUTLASS_ARCH_MMA_SM80_SUPPORTED

View File

@ -47,6 +47,8 @@
#include "cutlass/core_io.h"
#include "cutlass/util/tensor_view_io.h"
#include "cache_testbed_output.h"
namespace test {
namespace conv {
namespace device {
@ -116,7 +118,6 @@ public:
cutlass::Distribution::Kind dist_kind,
uint64_t seed) {
//cutlass::reference::host::TensorFill(view, Element(1.0f));
if (dist_kind == cutlass::Distribution::Uniform) {
int scope;
@ -126,7 +127,12 @@ public:
scope = 2;
}
else if (bits == 16) {
scope = 3;
if (cutlass::sizeof_bits<ElementAccumulator>::value <= 16) {
scope = 3;
}
else {
scope = 5;
}
}
else {
scope = 8;
@ -137,6 +143,7 @@ public:
else if (dist_kind == cutlass::Distribution::Identity) {
cutlass::reference::host::TensorFillIdentity(view);
}
else if (dist_kind == cutlass::Distribution::Gaussian) {
@ -321,6 +328,50 @@ public:
tensor_D_computed.sync_host();
//
// Reference check - support caching results
//
CachedTestKey cached_test_key = CreateCachedConv2dTestKey<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute
>(
kConvolutionalOperator,
problem_size,
alpha,
beta,
tensor_A.host_view(),
tensor_B.host_view(),
tensor_C.host_view()
);
//
// Look for the cached key
//
bool cached_result_loaded = false;
CachedTestResult cached_test_result;
std::string conv2d_result_cache_name =
std::string("cached_results_") + CUTLASS_TARGET_NAME + ".txt";
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
CachedTestResultListing cached_results(conv2d_result_cache_name);
auto cached = cached_results.find(cached_test_key);
cached_result_loaded = cached.first;
if (cached_result_loaded) {
cached_test_result = cached.second;
}
}
if (!cached_result_loaded) {
#if CUTLASS_CONV_TEST_UNIT_REFERENCE_DEVICE_ENABLED
cutlass::reference::device::Conv2d<
@ -367,9 +418,32 @@ public:
beta);
#endif
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
cached_test_result.D = TensorHash(tensor_D_reference.host_view());
CachedTestResultListing cached_results(conv2d_result_cache_name);
cached_results.append(cached_test_key, cached_test_result);
cached_results.write(conv2d_result_cache_name);
}
} // if (!cached_result_loaded)
uint32_t tensor_D_hash = TensorHash(tensor_D_computed.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
passed = (tensor_D_hash == cached_test_result.D);
EXPECT_EQ(tensor_D_hash, cached_test_result.D)
<< "Hash-based comparison failed for key:" << "\n" << cached_test_key << "\n";
}
else {
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
}
EXPECT_TRUE(passed);
@ -416,9 +490,18 @@ public:
results
<< "\nA:\n" << tensor_A.host_view() << "\n"
<< "\nB:\n" << tensor_B.host_view() << "\n"
<< "\nC:\n" << tensor_C.host_view() << "\n"
<< "\nD reference:\n" << tensor_D_reference.host_view() << "\n"
<< "\nD computed:\n" << tensor_D_computed.host_view() << "\n";
<< "\nC:\n" << tensor_C.host_view() << "\n";
results << "\nD reference (hash: " << cached_test_result.D << ")\n";
if (!cached_result_loaded) {
results
<< tensor_D_reference.host_view() << "\n";
}
results
<< "\nD computed (hash: " << tensor_D_hash << ")\n"
<< tensor_D_computed.host_view() << "\n";
}

View File

@ -48,6 +48,8 @@
#include "cutlass/core_io.h"
#include "cutlass/util/tensor_view_io.h"
#include "cache_testbed_output.h"
namespace test {
namespace conv {
namespace device {
@ -280,6 +282,50 @@ public:
tensor_D_computed.sync_host();
//
// Reference check - support caching results
//
CachedTestKey cached_test_key = CreateCachedConv2dTestKey<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute
>(
kConvolutionalOperator,
problem_size,
alpha,
beta,
tensor_A.host_view(),
tensor_B.host_view(),
tensor_C.host_view()
);
//
// Look for the cached key
//
bool cached_result_loaded = false;
CachedTestResult cached_test_result;
std::string conv2d_result_cache_name =
std::string("cached_results_") + CUTLASS_TARGET_NAME + ".txt";
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
CachedTestResultListing cached_results(conv2d_result_cache_name);
auto cached = cached_results.find(cached_test_key);
cached_result_loaded = cached.first;
if (cached_result_loaded) {
cached_test_result = cached.second;
}
}
if (!cached_result_loaded) {
#if CUTLASS_CONV_TEST_UNIT_REFERENCE_DEVICE_ENABLED
cutlass::reference::device::Conv2d<
@ -332,9 +378,32 @@ public:
beta);
#endif
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
cached_test_result.D = TensorHash(tensor_D_reference.host_view());
CachedTestResultListing cached_results(conv2d_result_cache_name);
cached_results.append(cached_test_key, cached_test_result);
cached_results.write(conv2d_result_cache_name);
}
} // if (!cached_result_loaded)
uint32_t tensor_D_hash = TensorHash(tensor_D_computed.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
passed = (tensor_D_hash == cached_test_result.D);
EXPECT_EQ(tensor_D_hash, cached_test_result.D)
<< "Hash-based comparison failed for key:" << "\n" << cached_test_key << "\n";
}
else {
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
}
EXPECT_TRUE(passed);
@ -345,12 +414,12 @@ public:
<< (split_k_mode == cutlass::conv::SplitKMode::kSerial ? "serial_reduction_" : "parallel_reduction_")
<< (Conv2d::kConvolutionalOperator == cutlass::conv::Operator::kFprop ? "fprop_" :
(Conv2d::kConvolutionalOperator == cutlass::conv::Operator::kDgrad ? "dgrad_" : "wgrad_"))
<< "nhwc_"
<< "ncxhwx_"
<< problem_size.N << "x"
<< problem_size.H << "x"
<< problem_size.W << "x"
<< problem_size.C
<< "_krsc_"
<< "_cxrskx_"
<< problem_size.K << "x"
<< problem_size.R << "x"
<< problem_size.S << "x"
@ -381,10 +450,18 @@ public:
results
<< "\nA:\n" << tensor_A.host_view() << "\n"
<< "\nB:\n" << tensor_B.host_view() << "\n"
<< "\nB_reordered =\n" << tensor_B_reordered.host_view() << "\n"
<< "\nC:\n" << tensor_C.host_view() << "\n"
<< "\nD reference:\n" << tensor_D_reference.host_view() << "\n"
<< "\nD computed:\n" << tensor_D_computed.host_view() << "\n";
<< "\nC:\n" << tensor_C.host_view() << "\n";
results << "\nD reference (hash: " << cached_test_result.D << ")\n";
if (!cached_result_loaded) {
results
<< tensor_D_reference.host_view() << "\n";
}
results
<< "\nD computed (hash: " << tensor_D_hash << ")\n"
<< tensor_D_computed.host_view() << "\n";
}

View File

@ -47,6 +47,8 @@
#include "cutlass/core_io.h"
#include "cutlass/util/tensor_view_io.h"
#include "cache_testbed_output.h"
namespace test {
namespace conv {
namespace device {
@ -109,11 +111,17 @@ public:
scope = 2;
}
else if (bits == 16) {
scope = 3;
if (cutlass::sizeof_bits<ElementAccumulator>::value <= 16) {
scope = 3;
}
else {
scope = 5;
}
}
else {
scope = 8;
}
cutlass::reference::host::TensorFillRandomUniform(
view, seed, scope, -scope, 0);
}
@ -263,6 +271,50 @@ public:
tensor_D_computed.sync_host();
//
// Reference check - support caching results
//
CachedTestKey cached_test_key = CreateCachedConv2dWithBroadcastTestKey<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute
>(
kConvolutionalOperator,
problem_size,
alpha,
beta,
tensor_A.host_view(),
tensor_B.host_view(),
tensor_C.host_view()
);
//
// Look for the cached key
//
bool cached_result_loaded = false;
CachedTestResult cached_test_result;
std::string conv2d_result_cache_name =
std::string("cached_results_") + CUTLASS_TARGET_NAME + ".txt";
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
CachedTestResultListing cached_results(conv2d_result_cache_name);
auto cached = cached_results.find(cached_test_key);
cached_result_loaded = cached.first;
if (cached_result_loaded) {
cached_test_result = cached.second;
}
}
if (!cached_result_loaded) {
#if CUTLASS_CONV_TEST_UNIT_REFERENCE_DEVICE_ENABLED
cutlass::reference::device::Conv2d<
@ -309,9 +361,33 @@ public:
beta);
#endif
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
cached_test_result.D = TensorHash(tensor_D_reference.host_view());
CachedTestResultListing cached_results(conv2d_result_cache_name);
cached_results.append(cached_test_key, cached_test_result);
cached_results.write(conv2d_result_cache_name);
}
} // if (!cached_result_loaded)
uint32_t tensor_D_hash = TensorHash(tensor_D_computed.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
passed = (tensor_D_hash == cached_test_result.D);
EXPECT_EQ(tensor_D_hash, cached_test_result.D)
<< "Hash-based comparison failed for key:" << "\n" << cached_test_key << "\n";
}
else {
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
}
EXPECT_TRUE(passed);

View File

@ -47,6 +47,8 @@
#include "cutlass/core_io.h"
#include "cutlass/util/tensor_view_io.h"
#include "cache_testbed_output.h"
namespace test {
namespace conv {
namespace device {
@ -114,7 +116,12 @@ public:
scope = 2;
}
else if (bits == 16) {
scope = 3;
if (cutlass::sizeof_bits<ElementAccumulator>::value <= 16) {
scope = 3;
}
else {
scope = 5;
}
}
else {
scope = 8;
@ -280,6 +287,50 @@ public:
tensor_D_computed.sync_host();
//
// Reference check - support caching results
//
CachedTestKey cached_test_key = CreateCachedConv2dWithReductionTestKey<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute
>(
kConvolutionalOperator,
problem_size,
alpha,
beta,
tensor_A.host_view(),
tensor_B.host_view(),
tensor_C.host_view()
);
//
// Look for the cached key
//
bool cached_result_loaded = false;
CachedTestResult cached_test_result;
std::string conv2d_result_cache_name =
std::string("cached_results_") + CUTLASS_TARGET_NAME + ".txt";
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
CachedTestResultListing cached_results(conv2d_result_cache_name);
auto cached = cached_results.find(cached_test_key);
cached_result_loaded = cached.first;
if (cached_result_loaded) {
cached_test_result = cached.second;
}
}
if (!cached_result_loaded) {
#if CUTLASS_CONV_TEST_UNIT_REFERENCE_DEVICE_ENABLED
cutlass::reference::device::Conv2d<
@ -326,9 +377,33 @@ public:
beta);
#endif
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
cached_test_result.D = TensorHash(tensor_D_reference.host_view());
CachedTestResultListing cached_results(conv2d_result_cache_name);
cached_results.append(cached_test_key, cached_test_result);
cached_results.write(conv2d_result_cache_name);
}
} // if (!cached_result_loaded)
uint32_t tensor_D_hash = TensorHash(tensor_D_computed.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
passed = (tensor_D_hash == cached_test_result.D);
EXPECT_EQ(tensor_D_hash, cached_test_result.D)
<< "Hash-based comparison failed for key:" << "\n" << cached_test_key << "\n";
}
else {
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
}
EXPECT_TRUE(passed);

View File

@ -67,7 +67,8 @@ TEST(SM80_Device_Conv3d_Dgrad_Analytic_ImplicitGemm_tf32ndhwc_tf32ndhwc_f32ndhwc
>,
cutlass::gemm::threadblock::GemmIdentityThreadblockSwizzle<>,
3,
cutlass::arch::OpMultiplyAdd
cutlass::arch::OpMultiplyAdd,
cutlass::conv::IteratorAlgorithm::kAnalytic
>::Kernel;
using Conv3dDgrad = cutlass::conv::device::ImplicitGemmConvolution<Conv3dDgradKernel>;

View File

@ -47,6 +47,8 @@
#include "conv3d_problems.h"
#include "cutlass/core_io.h"
#include "cache_testbed_output.h"
namespace test {
namespace conv {
namespace device {
@ -321,6 +323,50 @@ public:
tensor_D_computed.sync_host();
//
// Reference check - support caching results
//
CachedTestKey cached_test_key = CreateCachedConv3dTestKey<
ElementA, LayoutA,
ElementB, LayoutB,
ElementC, LayoutC,
ElementAccumulator,
ElementCompute
>(
kConvolutionalOperator,
problem_size,
alpha,
beta,
tensor_A.host_view(),
tensor_B.host_view(),
tensor_C.host_view()
);
//
// Look for the cached key
//
bool cached_result_loaded = false;
CachedTestResult cached_test_result;
std::string conv2d_result_cache_name =
std::string("cached_results_") + CUTLASS_TARGET_NAME + ".txt";
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
CachedTestResultListing cached_results(conv2d_result_cache_name);
auto cached = cached_results.find(cached_test_key);
cached_result_loaded = cached.first;
if (cached_result_loaded) {
cached_test_result = cached.second;
}
}
if (!cached_result_loaded) {
#if CUTLASS_CONV_TEST_UNIT_REFERENCE_DEVICE_ENABLED
cutlass::reference::device::Conv3d<
@ -368,10 +414,32 @@ public:
);
#endif
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
cached_test_result.D = TensorHash(tensor_D_reference.host_view());
CachedTestResultListing cached_results(conv2d_result_cache_name);
cached_results.append(cached_test_key, cached_test_result);
cached_results.write(conv2d_result_cache_name);
}
} // if (!cached_result_loaded)
uint32_t tensor_D_hash = TensorHash(tensor_D_computed.host_view());
if (CUTLASS_TEST_ENABLE_CACHED_RESULTS) {
passed = (tensor_D_hash == cached_test_result.D);
EXPECT_EQ(tensor_D_hash, cached_test_result.D)
<< "Hash-based comparison failed for key:" << "\n" << cached_test_key << "\n";
}
else {
passed = cutlass::reference::host::TensorEquals(
tensor_D_computed.host_view(),
tensor_D_reference.host_view());
}
EXPECT_TRUE(passed);
if (!passed) {
@ -422,9 +490,19 @@ public:
results
<< "\nA:\n" << tensor_A.host_view() << "\n"
<< "\nB:\n" << tensor_B.host_view() << "\n"
<< "\nC:\n" << tensor_C.host_view() << "\n"
<< "\nD reference:\n" << tensor_D_reference.host_view() << "\n"
<< "\nD computed:\n" << tensor_D_computed.host_view() << "\n";
<< "\nC:\n" << tensor_C.host_view() << "\n";
results << "\nD reference (hash: " << cached_test_result.D << ")\n";
if (!cached_result_loaded) {
results
<< tensor_D_reference.host_view() << "\n";
}
results
<< "\nD computed (hash: " << tensor_D_hash << ")\n"
<< tensor_D_computed.host_view() << "\n";
}

View File

@ -0,0 +1,473 @@
conv2d fprop_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1291629984 4250546017 486967919 3628559084
conv2d fprop_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1291629984 4250546017 486967919 3628559084
conv2d fprop_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3269355653 987911951 1919973277 3060288390
conv2d fprop_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3269355653 987911951 1919973277 2970039207
conv2d fprop_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3748422120 3644341259 1911021900 2231724975
conv2d fprop_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3748422120 3644341259 1911021900 32368867
conv2d fprop_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 472157622 1595526728 2963892063 3617758931
conv2d fprop_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 472157622 1595526728 2963892063 1213867461
conv2d fprop_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2555494614 224923131 3862463878 1032157693
conv2d fprop_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2555494614 224923131 3862463878 2512484574
conv2d fprop_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2311828961 1219404370 373331791 156090483
conv2d fprop_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2311828961 1219404370 373331791 2125643627
conv2d fprop_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2311828961 2400093115 2695215306 1183833128
conv2d fprop_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2311828961 2400093115 2695215306 950863078
conv2d fprop_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2311828961 1018998471 2132201986 1645211922
conv2d fprop_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2311828961 1018998471 2132201986 888922489
conv2d fprop_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2296142491 4250546017 1919973277 3242947060
conv2d fprop_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2296142491 4250546017 1919973277 3242947060
conv2d fprop_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2296142491 3644341259 1919973277 2570877648
conv2d fprop_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2296142491 3644341259 1919973277 3601912269
conv2d fprop_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1218117393 4250546017 1911021900 1777629475
conv2d fprop_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1218117393 4250546017 1911021900 1777629475
conv2d fprop_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3858018920 3830842503 5067603 2056042422
conv2d fprop_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3858018920 3830842503 5067603 3581028648
conv2d fprop_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3131990564 3914955377 2695215306 1284148249
conv2d fprop_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3131990564 3914955377 2695215306 529645467
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3975452619 4213557158 2381193183 3146807750
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3975452619 4213557158 2381193183 3919362272
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1463744869 4213557158 1038140209 2259020777
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1463744869 4213557158 1038140209 2073872618
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2629906455 3838546319 720746870 2382111738
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2629906455 3838546319 720746870 1697335701
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1212756742 4265921531 2290618404 3626933660
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1212756742 4265921531 2290618404 3626933660
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 241472534 468963831 2959096809 3337392869
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 241472534 468963831 2959096809 1465273757
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 796785810 2766914163 613201518 2545095524
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 796785810 2766914163 613201518 119102005
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3566971919 3050624323 167104692 2075508652
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3566971919 3050624323 167104692 249956416
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1307031978 1633048603 2557576548 825424571
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1307031978 1633048603 2557576548 3723250582
conv2d fprop_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 51486510 2467457616 1993107524 3917445532
conv2d fprop_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 51486510 2467457616 1993107524 723144309
conv2d fprop_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 806079124 1319256657 1041989393 4007092054
conv2d fprop_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 806079124 1319256657 1041989393 121750431
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2682525616 2411959438 1222599802 2705358355
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2682525616 2411959438 1222599802 1921082534
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2113351655 1888208948 1454859747 2429064071
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2113351655 1888208948 1454859747 2429064071
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2239997711 3765480640 1933240382 258792262
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2239997711 3765480640 1933240382 1350961289
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1124828340 632037627 1966904362 2674132654
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1124828340 632037627 1966904362 4061823028
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3787124528 2799725917 3426919182 1513280885
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3787124528 2799725917 3426919182 3304279324
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2109521687 2799725917 4185476157 1062588307
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2109521687 2799725917 4185476157 1737400068
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1329557640 2685661941 623381239 3456180201
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1329557640 2685661941 623381239 612510019
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 4076621732 2799725917 748585111 1918078890
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 4076621732 2799725917 748585111 1296506717
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 4076621732 2799725917 748585111 720321141
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 4076621732 2799725917 748585111 2250020808
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3826850269 1181458623 3933470176 1216324411
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3826850269 1181458623 3933470176 1337638334
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2161330459 2750022170 3879567407 2187352956
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2161330459 2750022170 3879567407 3505172898
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 61034797 3724098469 1954437668 3275330607
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 61034797 3724098469 1954437668 3211342413
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2979706213 840940128 2268084635 2574304052
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2979706213 840940128 2268084635 959147198
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 933902974 3274942180 1217977439 1759317211
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 933902974 3274942180 1217977439 3077847987
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 525054430 617641393 90427526 1404446496
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 525054430 617641393 90427526 4261451781
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2145363230 721318312 934864596 1375658938
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2145363230 721318312 934864596 90410819
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 fnhwc_fnhwc_fnhwc_f_f 3484291824 12477519 722450442 726679987
conv2d fprop_1x1x1x2_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1291629984 4250546017 4259529924 973561880
conv2d fprop_1x1x1x2_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1291629984 4250546017 4259529924 973561880
conv2d fprop_1x1x8x2_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3269355653 987911951 2963892063 653870217
conv2d fprop_1x1x8x2_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3269355653 987911951 2963892063 3381857140
conv2d fprop_1x7x8x2_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3748422120 3644341259 2132626684 727104696
conv2d fprop_1x7x8x2_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3748422120 3644341259 2132626684 857884834
conv2d fprop_1x7x9x2_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 472157622 1595526728 1755127071 1773464230
conv2d fprop_1x7x9x2_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 472157622 1595526728 1755127071 1800737809
conv2d fprop_2x7x9x2_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2555494614 224923131 2778187426 1408209490
conv2d fprop_2x7x9x2_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2555494614 224923131 2778187426 113009838
conv2d fprop_3x7x9x2_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2311828961 1219404370 1038140209 1972128042
conv2d fprop_3x7x9x2_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2311828961 1219404370 1038140209 740278031
conv2d fprop_3x7x9x2_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2311828961 2400093115 2381193183 3189138716
conv2d fprop_3x7x9x2_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2311828961 2400093115 2381193183 4117350218
conv2d fprop_3x7x9x2_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2311828961 1018998471 123247934 3895648089
conv2d fprop_3x7x9x2_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2311828961 1018998471 123247934 1801652807
conv2d fprop_1x11x7x2_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2296142491 4250546017 2963892063 1354630
conv2d fprop_1x11x7x2_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2296142491 4250546017 2963892063 1354630
conv2d fprop_1x11x7x2_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2296142491 3644341259 2963892063 2794615982
conv2d fprop_1x11x7x2_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2296142491 3644341259 2963892063 1407282247
conv2d fprop_1x13x11x2_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1218117393 4250546017 2132626684 4169859068
conv2d fprop_1x13x11x2_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1218117393 4250546017 2132626684 4169859068
conv2d fprop_1x17x19x2_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3858018920 3830842503 3268227320 1293623633
conv2d fprop_1x17x19x2_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3858018920 3830842503 3268227320 422114034
conv2d fprop_1x23x5x2_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3131990564 3914955377 2381193183 3106056962
conv2d fprop_1x23x5x2_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3131990564 3914955377 2381193183 3961289412
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3187654522 2811231923 3002932066 332595516
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3187654522 2811231923 3002932066 1038970344
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 939350077 2811231923 3710122981 1390001842
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 939350077 2811231923 3710122981 3516755647
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1957958032 2306828385 341432232 1207552588
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1957958032 2306828385 341432232 2056415706
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4005630370 105489309 212243307 3753643595
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4005630370 105489309 212243307 3753643595
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4148272483 1750065361 2212942576 1337682673
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4148272483 1750065361 2212942576 183620743
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 617040073 350396557 284178850 3286712256
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 617040073 350396557 284178850 2327714256
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2096370412 2318155471 835666052 4141289477
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2096370412 2318155471 835666052 2298284761
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3496218347 2077244131 2929697040 1641694950
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3496218347 2077244131 2929697040 1957029265
conv2d fprop_1x15x19x34_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1926056930 1319256657 950258165 4217829985
conv2d fprop_1x15x19x34_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1926056930 1319256657 950258165 1720028652
conv2d fprop_1x16x24x66_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2388882552 2500591916 3967280674 2026555219
conv2d fprop_1x16x24x66_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2388882552 2500591916 3967280674 2322971508
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 683582756 1395357567 3996211431 3665284572
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 683582756 1395357567 3996211431 201734166
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 982506873 1181458623 2289578760 3612707051
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 982506873 1181458623 2289578760 3612707051
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2185005209 2219118660 1440004873 3463834206
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2185005209 2219118660 1440004873 2512434087
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 613238853 1728048860 3033436585 2458388362
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 613238853 1728048860 3033436585 3613671804
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1261436340 2257098898 3140537372 3075173914
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1261436340 2257098898 3140537372 2600183629
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 254292619 2257098898 2668473724 3607778249
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 254292619 2257098898 2668473724 2808559748
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 772022222 4190341022 1138386226 449926041
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 772022222 4190341022 1138386226 1583119279
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3879922405 2257098898 4106573903 2990552295
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3879922405 2257098898 4106573903 760071194
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3879922405 2257098898 4106573903 2172129453
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3879922405 2257098898 4106573903 3098209529
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2751430422 3535384576 1178225662 264922690
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2751430422 3535384576 1178225662 638310695
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 634689168 1558178565 3438778114 3770158048
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 634689168 1558178565 3438778114 2838908779
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1906326545 268218351 3556752290 4160523498
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1906326545 268218351 3556752290 2865592304
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1481519788 2799725917 1070404771 3297631478
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1481519788 2799725917 1070404771 767059743
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1350987180 3287180835 87918186 1052120585
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1350987180 3287180835 87918186 1681505651
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 864673475 2278914712 345256678 1262388200
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 864673475 2278914712 345256678 301355370
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2136677961 1230883571 535024815 2000875092
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2136677961 1230883571 535024815 1840294626
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_0i_beta2_0i cnhwc_cnhwc_cnhwc_c_c 958260586 595219593 900622494 3754107310
conv2d dgrad_1x1x1x2_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3303215167 4250546017 3890556343 2998602688
conv2d dgrad_1x1x1x2_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3303215167 4250546017 3890556343 2998602688
conv2d dgrad_1x1x8x2_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 987911951 2980124304 2356394714
conv2d dgrad_1x1x8x2_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 987911951 2980124304 4022777716
conv2d dgrad_1x7x8x2_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 874639038 3644341259 802623080 2956519823
conv2d dgrad_1x7x8x2_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 874639038 3644341259 802623080 2062861672
conv2d dgrad_1x7x9x2_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3528407758 1595526728 2738672641 906097834
conv2d dgrad_1x7x9x2_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3528407758 1595526728 2738672641 3836417944
conv2d dgrad_2x7x9x2_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 639343303 224923131 311726682 1416127669
conv2d dgrad_2x7x9x2_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 639343303 224923131 311726682 2471877698
conv2d dgrad_3x7x9x2_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1075488054 1219404370 1146816700 3034531074
conv2d dgrad_3x7x9x2_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1075488054 1219404370 1146816700 4066967351
conv2d dgrad_3x7x9x2_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1325203442 2400093115 1146816700 693310298
conv2d dgrad_3x7x9x2_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1325203442 2400093115 1146816700 3135924868
conv2d dgrad_3x7x9x2_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 558171981 1018998471 1146816700 529330651
conv2d dgrad_3x7x9x2_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 558171981 1018998471 1146816700 2005367170
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3068101001 105489309 1542732212 3932236040
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3068101001 105489309 1542732212 3932236040
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4012287854 350396557 4055318830 3961661564
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4012287854 350396557 4055318830 3131592715
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1814966816 2318155471 2860596382 3615634589
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1814966816 2318155471 2860596382 4068533991
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1112763679 2077244131 923239372 4185176358
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1112763679 2077244131 923239372 2760678679
conv2d dgrad_1x15x19x34_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2216139934 1319256657 2148851182 4222196889
conv2d dgrad_1x15x19x34_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2216139934 1319256657 2148851182 3594057123
conv2d dgrad_1x16x24x66_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 859196912 2500591916 96801657 4090791495
conv2d dgrad_1x16x24x66_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 859196912 2500591916 96801657 3335462877
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1655739745 268218351 1632053434 381883460
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1655739745 268218351 1632053434 2882340861
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 178805580 2799725917 1965113500 2522976436
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 178805580 2799725917 1965113500 733838654
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 857551382 3287180835 3720443806 3464939495
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 857551382 3287180835 3720443806 1609144169
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1587615602 2278914712 424519891 3221010146
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1587615602 2278914712 424519891 2669791026
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2145363230 1230883571 2549378996 2649498772
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2145363230 1230883571 2549378996 3402864639
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_0i_beta2_0i cnhwc_cnhwc_cnhwc_c_c 1762516385 595219593 918164635 3122213356
conv2d wgrad_1x1x1x2_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3303215167 991930693 2980124304 2646402841
conv2d wgrad_1x1x1x2_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3303215167 991930693 2980124304 2646402841
conv2d wgrad_1x1x8x2_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 4250546017 294738383 2839064596
conv2d wgrad_1x1x8x2_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 4250546017 294738383 126798540
conv2d wgrad_1x7x8x2_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 874639038 1478369444 1588130777 3726346872
conv2d wgrad_1x7x8x2_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 874639038 1478369444 1588130777 2751024512
conv2d wgrad_1x7x9x2_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3528407758 3070204399 3036494114 2723605209
conv2d wgrad_1x7x9x2_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3528407758 3070204399 3036494114 1320740478
conv2d wgrad_2x7x9x2_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 639343303 2872812701 1239438433 3682382315
conv2d wgrad_2x7x9x2_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 639343303 2872812701 1239438433 1302999924
conv2d wgrad_3x7x9x2_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1075488054 3373210244 4207987780 1660673899
conv2d wgrad_3x7x9x2_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1075488054 3373210244 4207987780 2714640979
conv2d wgrad_3x7x9x2_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1325203442 3373210244 2381193183 1695826123
conv2d wgrad_3x7x9x2_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1325203442 3373210244 2381193183 805511206
conv2d wgrad_3x7x9x2_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 558171981 3373210244 2224388272 3988056388
conv2d wgrad_3x7x9x2_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 558171981 3373210244 2224388272 3477078834
conv2d wgrad_1x11x7x2_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 1219770266 2980124304 4226893215
conv2d wgrad_1x11x7x2_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 1219770266 2980124304 4226893215
conv2d wgrad_1x11x7x2_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 1219770266 1588130777 507860528
conv2d wgrad_1x11x7x2_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1134921014 1219770266 1588130777 197947685
conv2d wgrad_1x13x11x2_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 874639038 1458935684 2980124304 665196336
conv2d wgrad_1x13x11x2_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 874639038 1458935684 2980124304 665196336
conv2d wgrad_1x17x19x2_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 872104768 2927917918 3840288384 3199099046
conv2d wgrad_1x17x19x2_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 872104768 2927917918 3840288384 4041124990
conv2d wgrad_1x23x5x2_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1325203442 1018974017 2695215306 4046661096
conv2d wgrad_1x23x5x2_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1325203442 1018974017 2695215306 3480351868
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4145273678 2543470756 2731031538 2297420515
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4145273678 2543470756 2731031538 1328037289
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3825093358 4205517202 2731031538 710476466
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3825093358 4205517202 2731031538 2536080878
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1971123277 747484694 1069984549 2363498191
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1971123277 747484694 1069984549 3086819073
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3068101001 2172673608 472330470 2004815062
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3068101001 2172673608 472330470 2004815062
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2733349579 4187797427 4010744414 1794084581
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2733349579 4187797427 4010744414 4114524808
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4012287854 1017126775 3085573007 2255778450
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 4012287854 1017126775 3085573007 1202237741
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1814966816 1352955925 3175962793 2510381785
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1814966816 1352955925 3175962793 1158539581
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1112763679 3236296258 4126085678 2683550287
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1112763679 3236296258 4126085678 405842269
conv2d wgrad_1x15x19x34_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2216139934 1340523375 995921099 1592723627
conv2d wgrad_1x15x19x34_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2216139934 1340523375 995921099 309005134
conv2d wgrad_1x16x24x66_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 859196912 1358310556 2323019560 542694758
conv2d wgrad_1x16x24x66_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 859196912 1358310556 2323019560 2166847633
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2259629017 2475931707 1440799092 4221565216
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2259629017 2475931707 1440799092 3549830349
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3657056888 2153286596 2099843274 1726340662
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3657056888 2153286596 2099843274 1726340662
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1982243752 1023264400 3870616796 3807131300
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1982243752 1023264400 3870616796 1448894569
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2719672358 3720159962 198641006 877490804
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2719672358 3720159962 198641006 1819866268
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3808539997 3824664598 3887066342 1781681130
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 3808539997 3824664598 3887066342 568593004
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 365784208 397970234 3887066342 3219231066
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 365784208 397970234 3887066342 1952799079
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 649647965 4115158715 3687074625 2188687762
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 649647965 4115158715 3687074625 328038371
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2535440624 1855518467 3887066342 3554145843
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2535440624 1855518467 3887066342 629423006
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2535440624 1855518467 3887066342 4234955015
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2535440624 1855518467 3887066342 3741665130
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 575370052 296626169 3843555714 2515434981
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 575370052 296626169 3843555714 2997311698
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 933902974 1680322972 2268084635 947907958
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 933902974 1680322972 2268084635 1668453739
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1655739745 1407675647 3608965793 1545685731
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1655739745 1407675647 3608965793 1560811683
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 178805580 468297304 2081693980 2353241153
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 178805580 468297304 2081693980 3371496143
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 857551382 4022024717 3526617126 2530989957
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 857551382 4022024717 3526617126 1774437661
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1587615602 1932866802 3105677758 658488210
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 1587615602 1932866802 3105677758 3321302287
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2145363230 3735060046 3040777726 2073220474
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_0i_beta0_0i cnhwc_cnhwc_cnhwc_c_c 2145363230 3735060046 3040777726 3382548517
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_0i_beta2_0i cnhwc_cnhwc_cnhwc_c_c 1762516385 36879495 1156311284 3310348499
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2188357494 1769029067 159526285 825535581
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2188357494 1769029067 159526285 825535581
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1838714027 2265452184 2610359861 1987868270
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1838714027 2265452184 2610359861 728956432
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 3971681487 257610791 1008996088
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 3971681487 257610791 2555315413
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2318538354 3316437378 710632830 1863244686
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2318538354 3316437378 710632830 3946357538
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 672199864 3153681330 3307060297 2695612973
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 672199864 3153681330 3307060297 2564657101
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 2700620395 1556396665 2901584122
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 2700620395 1556396665 3078683181
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 3431458505 2293883251 1513830178
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 3431458505 2293883251 1456315771
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 728619567 2638743394 4157930574
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 728619567 2638743394 4280729276
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 1769029067 2610359861 829068145
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 1769029067 2610359861 829068145
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 3971681487 2610359861 3175191801
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 3971681487 2610359861 752965501
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1483240777 1769029067 257610791 1872463282
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1483240777 1769029067 257610791 1872463282
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3878803000 1547628165 652315301 3236250595
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3878803000 1547628165 652315301 115169690
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3474690180 3245600707 2293883251 1373982557
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3474690180 3245600707 2293883251 3038299705
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 876572357 663101280 1784121575 3650717238
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 876572357 663101280 1784121575 1844414540
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2926249914 663101280 1238102800 940361331
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2926249914 663101280 1238102800 1574520323
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 568740975 3647824478 1001821658 763311327
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 568740975 3647824478 1001821658 3755275557
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3351802863 889731117 1862926968 1133541197
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3351802863 889731117 1862926968 1133541197
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3680916718 2931605166 1380790217 1603771059
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3680916718 2931605166 1380790217 1384953419
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 865676658 3292777216 2570824137 1716239002
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 865676658 3292777216 2570824137 1207507795
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3471311976 3069685598 1501287327 2020885449
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3471311976 3069685598 1501287327 3540106320
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2012717243 4183087394 1158072871 2770857658
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2012717243 4183087394 1158072871 2753556152
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2639488807 1127821716 1175487408 1443444693
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2639488807 1127821716 1175487408 2615818500
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4005424028 560055529 3924773317 1674063910
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4005424028 560055529 3924773317 731082069
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2975308389 3388564462 540151004 2747507935
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2975308389 3388564462 540151004 916078700
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1609667174 3347123934 1942443225 927150176
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1609667174 3347123934 1942443225 927150176
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1910152888 4279006666 634623721 1857297775
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1910152888 4279006666 634623721 3617909140
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3020034528 2354621402 3496282292 1893593581
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3020034528 2354621402 3496282292 4168452665
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2432565675 683959930 1993750394 960818057
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2432565675 683959930 1993750394 3831768945
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1094435461 683959930 1546760441 3943198524
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1094435461 683959930 1546760441 297674396
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1881914243 1677559851 2710651669 1457186301
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1881914243 1677559851 2710651669 641199618
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 1219910572
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 2513734798
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 2022987417
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 1691115924
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3831097363 1912090452 140813403 3043290146
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3831097363 1912090452 140813403 2921616453
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1244925287 3609240260 3715463477 2323185695
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1244925287 3609240260 3715463477 1672551923
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3026255423 62170551 337645063 913747685
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3026255423 62170551 337645063 778811608
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3054241601 2539714930 725343835 1284495313
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3054241601 2539714930 725343835 2804300956
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3459414189 2300049969 3590051376 3773230297
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3459414189 2300049969 3590051376 3201976695
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 869473545 972211497 126335800 745587578
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 869473545 972211497 126335800 3427184805
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3759545138 698995736 2260090497 603560103
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3759545138 698995736 2260090497 3440870263
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_hnhwc_h_h 1541569966 3683140111 4057089521 1550530307
conv2d dgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 135000378 4250546017 3890556343 3840696830
conv2d dgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 135000378 4250546017 3890556343 3840696830
conv2d dgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 987911951 2980124304 2572054323
conv2d dgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 987911951 2980124304 4006425566
conv2d dgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1504270762 3644341259 802623080 1655787066
conv2d dgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1504270762 3644341259 802623080 2956350850
conv2d dgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1134921014 1595526728 2738672641 962312341
conv2d dgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1134921014 1595526728 2738672641 3126435132
conv2d dgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1113301030 224923131 311726682 4061102478
conv2d dgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1113301030 224923131 311726682 2314369199
conv2d dgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1431058757 1219404370 1146816700 3996872848
conv2d dgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1431058757 1219404370 1146816700 2269688958
conv2d dgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2568212047 2400093115 1146816700 1719436727
conv2d dgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2568212047 2400093115 1146816700 4236972782
conv2d dgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2133636964 1018998471 1146816700 1307853167
conv2d dgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2133636964 1018998471 1146816700 469937848
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1126681227 4265921531 1307969125 2041137857
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1126681227 4265921531 1307969125 2041137857
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3363792845 2766914163 1541598000 562462849
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3363792845 2766914163 1541598000 585918261
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2017514189 3050624323 2813830197 3551637995
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2017514189 3050624323 2813830197 2284323213
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2136362147 1633048603 2983167436 866644788
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2136362147 1633048603 2983167436 253066315
conv2d dgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 784928777 2467457616 1092494080 274183605
conv2d dgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 784928777 2467457616 1092494080 1241514327
conv2d dgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1928121195 1319256657 3541920582 2018009151
conv2d dgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1928121195 1319256657 3541920582 1303918704
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1089703540 3724098469 2351024902 941952011
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1089703540 3724098469 2351024902 3577527602
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1527509174 840940128 2574042419 2518679986
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1527509174 840940128 2574042419 3797768014
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3153833039 3274942180 3438778114 508409341
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3153833039 3274942180 3438778114 3918768286
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 805200720 617641393 2145192778 3649177283
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 805200720 617641393 2145192778 2392118609
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3916058745 721318312 535024815 4039199216
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3916058745 721318312 535024815 2891577765
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 fnhwc_fnhwc_fnhwc_f_f 3160120111 12477519 1682007569 2212069629
conv2d wgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 135000378 991930693 2980124304 2169312899
conv2d wgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 135000378 991930693 2980124304 2169312899
conv2d wgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 4250546017 294738383 1067638259
conv2d wgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 4250546017 294738383 504959928
conv2d wgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1504270762 1478369444 1588130777 587511439
conv2d wgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1504270762 1478369444 1588130777 3767308084
conv2d wgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1134921014 3070204399 3036494114 4124366680
conv2d wgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1134921014 3070204399 3036494114 2833785422
conv2d wgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1113301030 2872812701 1239438433 1775116239
conv2d wgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1113301030 2872812701 1239438433 1288542483
conv2d wgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1431058757 3373210244 4207987780 4054255409
conv2d wgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1431058757 3373210244 4207987780 180834054
conv2d wgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2568212047 3373210244 2381193183 353843599
conv2d wgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2568212047 3373210244 2381193183 1860329513
conv2d wgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2133636964 3373210244 2224388272 347055977
conv2d wgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2133636964 3373210244 2224388272 994788649
conv2d wgrad_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 1219770266 2980124304 1448608264
conv2d wgrad_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 1219770266 2980124304 1448608264
conv2d wgrad_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 1219770266 1588130777 2381531672
conv2d wgrad_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1501031342 1219770266 1588130777 3417974847
conv2d wgrad_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1504270762 1458935684 2980124304 2512582600
conv2d wgrad_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1504270762 1458935684 2980124304 2512582600
conv2d wgrad_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1642334467 2927917918 3840288384 2880620663
conv2d wgrad_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1642334467 2927917918 3840288384 2552969500
conv2d wgrad_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2568212047 1018974017 2695215306 3059274099
conv2d wgrad_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2568212047 1018974017 2695215306 3436607346
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1325203442 2973628448 3097125139 3643918743
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1325203442 2973628448 3097125139 747082267
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1075488054 4153253284 3097125139 21340657
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1075488054 4153253284 3097125139 56227083
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2373792510 4228778230 3268227320 2781787969
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2373792510 4228778230 3268227320 4054149767
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1126681227 448814756 4020828414 692686929
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1126681227 448814756 4020828414 692686929
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 4098697864 2355686406 2621782130 2833949486
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 4098697864 2355686406 2621782130 3251496823
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3363792845 68416507 3062073018 220836046
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3363792845 68416507 3062073018 1707620502
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2017514189 2695053579 4119019906 338363935
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2017514189 2695053579 4119019906 738717986
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2136362147 2323702535 2730633195 4275642741
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2136362147 2323702535 2730633195 3105473059
conv2d wgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 784928777 3920994243 2871183684 1457368860
conv2d wgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 784928777 3920994243 2871183684 2129608645
conv2d wgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1928121195 1834136816 995921099 1290832901
conv2d wgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1928121195 1834136816 995921099 154477589
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3829716048 824597450 3596813277 3377048584
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3829716048 824597450 3596813277 412509722
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1276391848 1858648938 3730143675 2712417789
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1276391848 1858648938 3730143675 2712417789
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2991748655 996994755 3162712336 2691220362
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2991748655 996994755 3162712336 3441232209
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 613238853 3737415653 1813717058 3953491679
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 613238853 3737415653 1813717058 1261891081
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3074259140 3369591202 2081693980 3439473075
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3074259140 3369591202 2081693980 3352279175
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2475424603 3047230488 2081693980 3359165930
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 2475424603 3047230488 2081693980 1942009480
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3980242078 2830864967 1000406280 332157749
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3980242078 2830864967 1000406280 2601063004
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 870738555 640024666 2081693980 4100031453
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 870738555 640024666 2081693980 1919107176
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 870738555 640024666 2081693980 1618717912
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 870738555 640024666 2081693980 221251170
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1467525936 2166215692 2099843274 1752033731
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1467525936 2166215692 2099843274 2254410747
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1441608968 3983207745 3357056235 4220059751
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1441608968 3983207745 3357056235 3334646036
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1089703540 1191155361 852881505 1729883415
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1089703540 1191155361 852881505 3112064590
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1527509174 2779255425 1217669626 2313445327
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 1527509174 2779255425 1217669626 2378687243
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3153833039 1258133396 2989357662 2523233417
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3153833039 1258133396 2989357662 845687444
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 805200720 858259717 3333097025 2967627788
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 805200720 858259717 3333097025 285381561
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3916058745 443607763 3443985888 4252958697
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 fnhwc_fnhwc_fnhwc_f_f 3916058745 443607763 3443985888 160172027
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 fnhwc_fnhwc_fnhwc_f_f 3160120111 1536824438 422976060 2522704893

View File

@ -0,0 +1,207 @@
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2188357494 1769029067 159526285 825535581
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2188357494 1769029067 159526285 825535581
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1838714027 2265452184 2610359861 1987868270
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1838714027 2265452184 2610359861 728956432
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 3971681487 257610791 1008996088
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 3971681487 257610791 2555315413
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2318538354 3316437378 710632830 1863244686
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2318538354 3316437378 710632830 3946357538
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 672199864 3153681330 3307060297 2695612973
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 672199864 3153681330 3307060297 2564657101
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 2700620395 1556396665 2901584122
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 2700620395 1556396665 3078683181
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 3431458505 2293883251 1513830178
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 3431458505 2293883251 1456315771
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 728619567 2638743394 4157930574
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3966476684 728619567 2638743394 4280729276
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 1769029067 2610359861 829068145
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 1769029067 2610359861 829068145
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 3971681487 2610359861 3175191801
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2760870769 3971681487 2610359861 752965501
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1483240777 1769029067 257610791 1872463282
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1483240777 1769029067 257610791 1872463282
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3878803000 1547628165 652315301 3236250595
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3878803000 1547628165 652315301 115169690
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3474690180 3245600707 2293883251 1373982557
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3474690180 3245600707 2293883251 3038299705
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 876572357 663101280 1784121575 3650717238
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 876572357 663101280 1784121575 1844414540
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2926249914 663101280 1238102800 940361331
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2926249914 663101280 1238102800 1574520323
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 568740975 3647824478 1001821658 763311327
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 568740975 3647824478 1001821658 3755275557
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3351802863 889731117 1862926968 1133541197
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3351802863 889731117 1862926968 1133541197
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3680916718 2931605166 1380790217 1603771059
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3680916718 2931605166 1380790217 1384953419
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 865676658 3292777216 2570824137 1716239002
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 865676658 3292777216 2570824137 1207507795
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3471311976 3069685598 1501287327 2020885449
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3471311976 3069685598 1501287327 3540106320
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2012717243 4183087394 1158072871 2770857658
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2012717243 4183087394 1158072871 2753556152
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2639488807 1127821716 1175487408 1443444693
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2639488807 1127821716 1175487408 2615818500
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4005424028 560055529 3924773317 1674063910
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4005424028 560055529 3924773317 731082069
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2975308389 3388564462 540151004 2747507935
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2975308389 3388564462 540151004 916078700
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1609667174 3347123934 1942443225 927150176
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1609667174 3347123934 1942443225 927150176
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1910152888 4279006666 634623721 1857297775
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1910152888 4279006666 634623721 3617909140
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3020034528 2354621402 3496282292 1893593581
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3020034528 2354621402 3496282292 4168452665
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2432565675 683959930 1993750394 960818057
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2432565675 683959930 1993750394 3831768945
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1094435461 683959930 1546760441 3943198524
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1094435461 683959930 1546760441 297674396
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1881914243 1677559851 2710651669 1457186301
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1881914243 1677559851 2710651669 641199618
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 1219910572
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 2513734798
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 2022987417
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3323210016 683959930 3090812263 1691115924
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3831097363 1912090452 140813403 3043290146
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3831097363 1912090452 140813403 2921616453
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1244925287 3609240260 3715463477 2323185695
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1244925287 3609240260 3715463477 1672551923
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3026255423 62170551 337645063 913747685
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3026255423 62170551 337645063 778811608
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3054241601 2539714930 725343835 1284495313
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3054241601 2539714930 725343835 2804300956
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3459414189 2300049969 3590051376 3773230297
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3459414189 2300049969 3590051376 3201976695
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 869473545 972211497 126335800 745587578
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 869473545 972211497 126335800 3427184805
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3759545138 698995736 2260090497 603560103
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3759545138 698995736 2260090497 3440870263
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_hnhwc_h_h 1541569966 3683140111 4057089521 1550530307
conv2d fprop_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 439881880 2361007913 550417941
conv2d fprop_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 439881880 2361007913 511192308
conv2d fprop_1x4x4x14_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2604126736 2435640339 2361007913 968601759
conv2d fprop_1x4x4x14_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2604126736 2435640339 2361007913 144578446
conv2d fprop_1x23x56x98_10x22_128x3x3_pad_h4w5_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4198134089 972211497 1394525436 3504696155
conv2d fprop_1x23x56x98_10x22_128x3x3_pad_h4w5_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4198134089 972211497 1394525436 3698098218
conv2d fprop_1x4x4x28_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 1672619248 2361007913 1369103290
conv2d fprop_1x4x4x28_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 1672619248 2361007913 489904325
conv2d fprop_1x23x56x100_10x22_128x3x3_pad_h4w5_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4291047527 2579050400 1394525436 351315258
conv2d fprop_1x23x56x100_10x22_128x3x3_pad_h4w5_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4291047527 2579050400 1394525436 1597164252
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 882369639 1769029067 2361007913 2527823846
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 882369639 1769029067 2361007913 2527823846
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 2265452184 1363379414 300054115
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 2265452184 1363379414 3807580965
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 3971681487 257610791 2386732272
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 3971681487 257610791 4258410038
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1057722415 3316437378 889102087 2570634199
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1057722415 3316437378 889102087 171700712
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1856996643 3153681330 2728188831 2975997856
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1856996643 3153681330 2728188831 2889418578
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3890032868 2700620395 2547817029 3967064079
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3890032868 2700620395 2547817029 3184265450
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3787596573 3431458505 2547817029 964612107
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3787596573 3431458505 2547817029 2037559507
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3247824247 728619567 2547817029 3557273069
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3247824247 728619567 2547817029 4397155
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 74280264 889731117 1508034024 1365806907
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 74280264 889731117 1508034024 1365806907
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1282400930 3292777216 2278368940 8357438
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1282400930 3292777216 2278368940 226365504
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4245845173 3069685598 99670743 325988631
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4245845173 3069685598 99670743 2434233848
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2504130563 4183087394 1801140850 1590712227
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2504130563 4183087394 1801140850 2545352669
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1766181903 1127821716 1260519450 2958285630
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1766181903 1127821716 1260519450 3013578259
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 183183414 560055529 2304892275 2542844870
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 183183414 560055529 2304892275 2460120362
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 202999757 62170551 888583293 630899132
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 202999757 62170551 888583293 2651936157
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 64770922 2539714930 291707000 1632621462
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 64770922 2539714930 291707000 2196326316
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1553906912 2300049969 270479912 1418534287
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1553906912 2300049969 270479912 2969883907
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4010944083 972211497 2352115326 3241394959
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4010944083 972211497 2352115326 3084585540
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 920147836 698995736 4291786732 4085488230
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 920147836 698995736 4291786732 65254192
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_hnhwc_h_h 2823085435 3683140111 2381613519 4075620655
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 882369639 2469118171 1363379414 2536698895
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 882369639 2469118171 1363379414 2536698895
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 1769029067 2610359861 2675562568
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 1769029067 2610359861 931542610
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 4237122930 2293883251 3279943011
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 4237122930 2293883251 2971660764
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1057722415 4274209342 2000691267 560753121
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1057722415 4274209342 2000691267 2154075967
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1856996643 2435640339 4206304784 607086828
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1856996643 2435640339 4206304784 1740786933
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3890032868 3485693384 722716191 534106900
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3890032868 3485693384 722716191 1330324832
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3787596573 3485693384 2298261608 3272993277
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3787596573 3485693384 2298261608 809879168
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3247824247 3485693384 677398494 3545662177
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3247824247 3485693384 677398494 406656675
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 4228252800 1363379414 1916931500
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 4228252800 1363379414 1916931500
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 4228252800 2293883251 2596039814
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1089974555 4228252800 2293883251 2187291295
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 27036473 1363379414 1933529223
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 702641729 27036473 1363379414 1933529223
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2903517501 1191123585 2874079035 3411667027
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2903517501 1191123585 2874079035 803905560
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3787596573 598080595 1784121575 644569158
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3787596573 598080595 1784121575 2373347066
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3227777797 329714136 2976030512 1014758557
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3227777797 329714136 2976030512 3940634369
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2301757939 1530947948 2976030512 3694497516
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2301757939 1530947948 2976030512 835787843
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2617901288 2993361563 1502330852 2213153149
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2617901288 2993361563 1502330852 4284874546
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 74280264 1916026608 2010130163 369232966
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 74280264 1916026608 2010130163 369232966
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1666425148 2767428662 2279791261 4027210146
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1666425148 2767428662 2279791261 1318730126
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1282400930 2713937462 3240894382 506695315
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1282400930 2713937462 3240894382 816815166
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4245845173 1573282079 3850186149 4106577752
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4245845173 1573282079 3850186149 355691834
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2504130563 4047167459 2936630712 348206756
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2504130563 4047167459 2936630712 2784859021
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1766181903 4273504437 787340207 1859862221
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1766181903 4273504437 787340207 3725886099
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 183183414 3105456251 3826106137 974970753
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 183183414 3105456251 3826106137 3416657232
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3483168388 424125191 908150856 1561140377
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3483168388 424125191 908150856 188844017
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 556825749 1391936148 2475632360 2800518880
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 556825749 1391936148 2475632360 2800518880
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3638123775 1173557136 2296711591 633157930
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3638123775 1173557136 2296711591 2368475048
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 649525056 3855280460 3101885145 2961254635
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 649525056 3855280460 3101885145 3741625104
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2173736421 3547027896 2104091502 3064810292
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2173736421 3547027896 2104091502 3713272088
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2709957180 1282487297 2104091502 744834192
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2709957180 1282487297 2104091502 904876309
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3651249563 4031283235 1508206782 2694170352
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3651249563 4031283235 1508206782 3908734231
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3355104310 3659562123 2104091502 2337157193
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3355104310 3659562123 2104091502 2313638308
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3355104310 3659562123 2104091502 3685548808
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 3355104310 3659562123 2104091502 2598517610
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2990284284 1468341695 784812405 1657604983
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 2990284284 1468341695 784812405 1091864392
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 777450620 1302452628 2792629935 1858657589
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 777450620 1302452628 2792629935 17882029
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 202999757 1750335029 2181422926 4235795050
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 202999757 1750335029 2181422926 4023494188
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 64770922 821682484 2518007336 481779259
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 64770922 821682484 2518007336 973321278
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1553906912 3381440542 537676326 3225233411
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 1553906912 3381440542 537676326 1804899744
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4010944083 3959973438 1089446814 942114500
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 4010944083 3959973438 1089446814 3331001854
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 920147836 2098470176 1991739118 2991567146
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_h_h 920147836 2098470176 1991739118 244560469
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_hnhwc_h_h 2823085435 2750615938 1907430051 3805642950

View File

@ -0,0 +1,197 @@
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1152388039 486967919 3706990238
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1152388039 486967919 3706990238
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1585175937 2411745115 1919973277 506127908
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1585175937 2411745115 1919973277 2193864160
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 3872812830
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2445012180
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3892602751 3987447721 2963892063 3556328678
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3892602751 3987447721 2963892063 2088376980
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1647798936 1986983586 3862463878 498933688
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1647798936 1986983586 3862463878 2581533408
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 3844983048 373331791 3515334098
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 3844983048 373331791 2566159340
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 741820436 2695215306 4235633178
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 741820436 2695215306 815310604
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 2188679282 2132201986 1043483661
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 2188679282 2132201986 2172013863
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 1152388039 1919973277 1836150764
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 1152388039 1919973277 1836150764
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 4021016722 1919973277 3537245111
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 4021016722 1919973277 1166347001
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3708184432 1152388039 1911021900 4188669650
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3708184432 1152388039 1911021900 4188669650
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3793481427 2784674253 5067603 3709403009
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3793481427 2784674253 5067603 3666537740
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 724504571 866495443 2695215306 2273666993
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 724504571 866495443 2695215306 3277012289
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3696992523 2499748007 2381193183 4256475381
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3696992523 2499748007 2381193183 868016148
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3999848747 2499748007 1038140209 3720347250
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3999848747 2499748007 1038140209 3079806253
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1193090006 2131084833 720746870 1441382904
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1193090006 2131084833 720746870 2400159337
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3123356211 67170595 2290618404 1832291434
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3123356211 67170595 2290618404 1832291434
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 374093114 3867270480 2959096809 3957922181
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 374093114 3867270480 2959096809 855145836
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3983093985 3903005020 613201518 1067564721
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3983093985 3903005020 613201518 3116342099
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3167361585 764195688 167104692 3451521719
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3167361585 764195688 167104692 2267030515
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2514717945 2683853778 2557576548 3978291544
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2514717945 2683853778 2557576548 2608287914
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1072544153 768805504 1993107524 2984226313
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1072544153 768805504 1993107524 3008259681
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3875284691 1195875134 1041989393 1900995663
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3875284691 1195875134 1041989393 392783151
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3179965682 1961598694 1222599802 2151043714
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3179965682 1961598694 1222599802 1013916354
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2615784276 3832095556 1454859747 958765281
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2615784276 3832095556 1454859747 958765281
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 674692187 808380753 1933240382 879488563
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 674692187 808380753 1933240382 1399508988
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 961566038 2529610490 1966904362 1818870269
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 961566038 2529610490 1966904362 2484388308
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3562503578 4021646304 3426919182 4130346493
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3562503578 4021646304 3426919182 3486420438
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1144321310 4021646304 4185476157 964986272
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1144321310 4021646304 4185476157 1800819557
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3153402236 2244058322 623381239 4197612113
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3153402236 2244058322 623381239 2816226027
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 438913488
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 2812015344
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 307241203
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 3413043496
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4047780986 3796154296 3933470176 2042558105
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4047780986 3796154296 3933470176 2082898655
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4196208609 640419443 3879567407 3126196765
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4196208609 640419443 3879567407 370340580
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1494714374 785253250 1954437668 16145912
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1494714374 785253250 1954437668 352471766
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4104811786 417350231 2268084635 3829320356
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4104811786 417350231 2268084635 3317921115
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3747780903 2173099720 1217977439 3831700802
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3747780903 2173099720 1217977439 2066501805
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2475183841 2416021807 90427526 3879607464
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2475183841 2416021807 90427526 3914420497
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 835429033 3252222904 934864596 2610068735
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 835429033 3252222904 934864596 4160630405
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 83915378 2330495260 722450442 220865236
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 1152388039 1036082506 2004021933
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 1152388039 1036082506 2004021933
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 2411745115 1585402383 692064357
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 2411745115 1585402383 3191762167
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2493803192
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2915688271
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3987447721 311726682 356690874
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3987447721 311726682 3600277581
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 1986983586 1898068767 1480022038
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 1986983586 1898068767 1482170634
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 3844983048 3628298618 1684782062
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 3844983048 3628298618 1312771437
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 741820436 3628298618 3927854537
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 741820436 3628298618 3753859236
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 2188679282 3628298618 331956491
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 2188679282 3628298618 3514953364
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 67170595 1307969125 1500995359
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 67170595 1307969125 1500995359
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 3903005020 1541598000 4224357357
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 3903005020 1541598000 1962390570
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 764195688 2813830197 3377586111
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 764195688 2813830197 1315372741
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 2683853778 2983167436 324191835
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 2683853778 2983167436 1085373547
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 768805504 3823519277 1916712483
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 768805504 3823519277 1584393587
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 1195875134 2636428043 1173364286
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 1195875134 2636428043 4109782860
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 785253250 2351024902 3316943078
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 785253250 2351024902 1065622134
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 417350231 2574042419 294608043
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 417350231 2574042419 491435109
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 2173099720 3438778114 3788164138
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 2173099720 3438778114 2104210385
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 2416021807 2145192778 2640510765
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 2416021807 2145192778 2748647248
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3252222904 535024815 169162784
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3252222904 535024815 3841086721
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 2329920945 2330495260 1682007569 215965178
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 3282100285 1585402383 820104967
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 3282100285 1585402383 820104967
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 1919973277 4103626856
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 1919973277 4164492975
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 2527774459 2695215306 1519678771
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 2527774459 2695215306 4056436284
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3488761154 1737428004 2359527095
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3488761154 1737428004 2240340004
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 2242491745 475190714 3363555017
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 2242491745 475190714 2240937477
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 1231166805 3030543492 1587793687
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 1231166805 3030543492 4129044530
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 1231166805 3002932066 1436246794
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 1231166805 3002932066 2860692730
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 1231166805 2704246666 3831504826
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 1231166805 2704246666 932276705
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 1585402383 584217576
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 1585402383 584217576
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 2695215306 644274899
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 2695215306 2070383610
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 3269716347 1585402383 2091838742
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 3269716347 1585402383 2091838742
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2208297031 3036494114 1391639360
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2208297031 3036494114 2853291206
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 3638907161 2381193183 4076043307
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 3638907161 2381193183 162466399
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 1748311260 3097125139 1760368998
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 1748311260 3097125139 370487040
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 950177617 3097125139 2441672462
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 950177617 3097125139 4093130692
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 3223936144 3268227320 3407045986
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 3223936144 3268227320 3327506975
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 2413111238 4020828414 3782469663
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 2413111238 4020828414 3782469663
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 1849062825 2621782130 1997835815
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 1849062825 2621782130 2176605786
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 1028019427 3062073018 1532225578
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 1028019427 3062073018 3175924537
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 665408258 4119019906 3070068838
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 665408258 4119019906 4095170522
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 1329921014 2730633195 1859011130
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 1329921014 2730633195 1829382848
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 654394569 180842421 456267566
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 654394569 180842421 4065629708
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 792561864 3949436648 2346117136
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 792561864 3949436648 3375703263
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 2182213461 3596813277 2680766255
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 2182213461 3596813277 819444109
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 4284293314 3730143675 2330242371
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 4284293314 3730143675 2330242371
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 1488124595 3162712336 2186928678
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 1488124595 3162712336 4038147074
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 1324698024 1813717058 1491574211
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 1324698024 1813717058 664642450
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 1617738198 2081693980 1691976762
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 1617738198 2081693980 1352928468
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 169231440 2081693980 4154079864
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 169231440 2081693980 49240552
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 1111691860 1000406280 1708014479
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 1111691860 1000406280 2976393539
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 141423768
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 1807012226
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 4065587708
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 3621154478
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 4018387624 2099843274 3166971951
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 4018387624 2099843274 710495809
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 1007447386 3357056235 3446932548
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 1007447386 3357056235 344178277
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 4040055257 852881505 1633246355
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 4040055257 852881505 778858244
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 428926092 1217669626 1090782686
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 428926092 1217669626 1523455590
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 1787889194 2989357662 3134613422
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 1787889194 2989357662 1158845444
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 857847029 3333097025 3239572160
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 857847029 3333097025 2436320376
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3294874067 3443985888 4083335585
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3294874067 3443985888 3302917564
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 2329920945 531242570 422976060 2227466455

View File

@ -0,0 +1,472 @@
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1152388039 486967919 3706990238
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1152388039 486967919 3706990238
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1585175937 2411745115 1919973277 506127908
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1585175937 2411745115 1919973277 2193864160
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 3872812830
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2445012180
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3892602751 3987447721 2963892063 3556328678
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3892602751 3987447721 2963892063 2088376980
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1647798936 1986983586 3862463878 498933688
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1647798936 1986983586 3862463878 2581533408
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 3844983048 373331791 3515334098
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 3844983048 373331791 2566159340
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 741820436 2695215306 4235633178
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 741820436 2695215306 815310604
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 2188679282 2132201986 1043483661
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 2188679282 2132201986 2172013863
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 1152388039 1919973277 1836150764
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 1152388039 1919973277 1836150764
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 4021016722 1919973277 3537245111
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 4021016722 1919973277 1166347001
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3708184432 1152388039 1911021900 4188669650
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3708184432 1152388039 1911021900 4188669650
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3793481427 2784674253 5067603 3709403009
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3793481427 2784674253 5067603 3666537740
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 724504571 866495443 2695215306 2273666993
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 724504571 866495443 2695215306 3277012289
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3696992523 2499748007 2381193183 4256475381
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3696992523 2499748007 2381193183 868016148
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3999848747 2499748007 1038140209 3720347250
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3999848747 2499748007 1038140209 3079806253
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1193090006 2131084833 720746870 1441382904
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1193090006 2131084833 720746870 2400159337
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3123356211 67170595 2290618404 1832291434
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3123356211 67170595 2290618404 1832291434
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 374093114 3867270480 2959096809 3957922181
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 374093114 3867270480 2959096809 855145836
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3983093985 3903005020 613201518 1067564721
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3983093985 3903005020 613201518 3116342099
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3167361585 764195688 167104692 3451521719
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3167361585 764195688 167104692 2267030515
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2514717945 2683853778 2557576548 3978291544
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2514717945 2683853778 2557576548 2608287914
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1072544153 768805504 1993107524 2984226313
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1072544153 768805504 1993107524 3008259681
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3875284691 1195875134 1041989393 1900995663
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3875284691 1195875134 1041989393 392783151
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3179965682 1961598694 1222599802 2151043714
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3179965682 1961598694 1222599802 1013916354
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2615784276 3832095556 1454859747 958765281
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2615784276 3832095556 1454859747 958765281
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 674692187 808380753 1933240382 879488563
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 674692187 808380753 1933240382 1399508988
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 961566038 2529610490 1966904362 1818870269
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 961566038 2529610490 1966904362 2484388308
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3562503578 4021646304 3426919182 4130346493
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3562503578 4021646304 3426919182 3486420438
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1144321310 4021646304 4185476157 964986272
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1144321310 4021646304 4185476157 1800819557
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3153402236 2244058322 623381239 4197612113
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3153402236 2244058322 623381239 2816226027
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 438913488
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 2812015344
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 307241203
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 3413043496
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4047780986 3796154296 3933470176 2042558105
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4047780986 3796154296 3933470176 2082898655
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4196208609 640419443 3879567407 3126196765
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4196208609 640419443 3879567407 370340580
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1494714374 785253250 1954437668 16145912
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1494714374 785253250 1954437668 352471766
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4104811786 417350231 2268084635 3829320356
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4104811786 417350231 2268084635 3317921115
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3747780903 2173099720 1217977439 3831700802
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3747780903 2173099720 1217977439 2066501805
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2475183841 2416021807 90427526 3879607464
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2475183841 2416021807 90427526 3914420497
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 835429033 3252222904 934864596 2610068735
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 835429033 3252222904 934864596 4160630405
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 83915378 2330495260 722450442 220865236
conv2d fprop_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1189071464 1036082506 1072586342
conv2d fprop_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1189071464 1036082506 3209300743
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 1152388039 1036082506 2004021933
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 1152388039 1036082506 2004021933
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 2411745115 1585402383 692064357
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 2411745115 1585402383 3191762167
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2493803192
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2915688271
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3987447721 311726682 356690874
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3987447721 311726682 3600277581
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 1986983586 1898068767 1480022038
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 1986983586 1898068767 1482170634
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 3844983048 3628298618 1684782062
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 3844983048 3628298618 1312771437
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 741820436 3628298618 3927854537
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 741820436 3628298618 3753859236
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 2188679282 3628298618 331956491
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 2188679282 3628298618 3514953364
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 67170595 1307969125 1500995359
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 67170595 1307969125 1500995359
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 3903005020 1541598000 4224357357
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 3903005020 1541598000 1962390570
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 764195688 2813830197 3377586111
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 764195688 2813830197 1315372741
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 2683853778 2983167436 324191835
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 2683853778 2983167436 1085373547
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 768805504 3823519277 1916712483
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 768805504 3823519277 1584393587
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 1195875134 2636428043 1173364286
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 1195875134 2636428043 4109782860
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 785253250 2351024902 3316943078
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 785253250 2351024902 1065622134
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 417350231 2574042419 294608043
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 417350231 2574042419 491435109
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 2173099720 3438778114 3788164138
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 2173099720 3438778114 2104210385
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 2416021807 2145192778 2640510765
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 2416021807 2145192778 2748647248
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3252222904 535024815 169162784
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3252222904 535024815 3841086721
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 2329920945 2330495260 1682007569 215965178
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 3282100285 1585402383 820104967
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 3282100285 1585402383 820104967
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 1919973277 4103626856
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 1919973277 4164492975
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 2527774459 2695215306 1519678771
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 2527774459 2695215306 4056436284
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3488761154 1737428004 2359527095
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3488761154 1737428004 2240340004
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 2242491745 475190714 3363555017
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 2242491745 475190714 2240937477
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 1231166805 3030543492 1587793687
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 1231166805 3030543492 4129044530
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 1231166805 3002932066 1436246794
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 1231166805 3002932066 2860692730
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 1231166805 2704246666 3831504826
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 1231166805 2704246666 932276705
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 1585402383 584217576
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 1585402383 584217576
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 2695215306 644274899
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 2695215306 2070383610
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 3269716347 1585402383 2091838742
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 3269716347 1585402383 2091838742
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2208297031 3036494114 1391639360
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2208297031 3036494114 2853291206
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 3638907161 2381193183 4076043307
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 3638907161 2381193183 162466399
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 1748311260 3097125139 1760368998
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 1748311260 3097125139 370487040
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 950177617 3097125139 2441672462
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 950177617 3097125139 4093130692
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 3223936144 3268227320 3407045986
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 3223936144 3268227320 3327506975
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 2413111238 4020828414 3782469663
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 2413111238 4020828414 3782469663
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 1849062825 2621782130 1997835815
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 1849062825 2621782130 2176605786
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 1028019427 3062073018 1532225578
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 1028019427 3062073018 3175924537
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 665408258 4119019906 3070068838
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 665408258 4119019906 4095170522
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 1329921014 2730633195 1859011130
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 1329921014 2730633195 1829382848
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 654394569 180842421 456267566
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 654394569 180842421 4065629708
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 792561864 3949436648 2346117136
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 792561864 3949436648 3375703263
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 2182213461 3596813277 2680766255
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 2182213461 3596813277 819444109
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 4284293314 3730143675 2330242371
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 4284293314 3730143675 2330242371
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 1488124595 3162712336 2186928678
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 1488124595 3162712336 4038147074
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 1324698024 1813717058 1491574211
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 1324698024 1813717058 664642450
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 1617738198 2081693980 1691976762
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 1617738198 2081693980 1352928468
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 169231440 2081693980 4154079864
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 169231440 2081693980 49240552
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 1111691860 1000406280 1708014479
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 1111691860 1000406280 2976393539
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 141423768
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 1807012226
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 4065587708
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 3621154478
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 4018387624 2099843274 3166971951
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 4018387624 2099843274 710495809
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 1007447386 3357056235 3446932548
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 1007447386 3357056235 344178277
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 4040055257 852881505 1633246355
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 4040055257 852881505 778858244
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 428926092 1217669626 1090782686
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 428926092 1217669626 1523455590
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 1787889194 2989357662 3134613422
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 1787889194 2989357662 1158845444
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 857847029 3333097025 3239572160
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 857847029 3333097025 2436320376
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3294874067 3443985888 4083335585
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3294874067 3443985888 3302917564
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 2329920945 531242570 422976060 2227466455
conv2d wgrad_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 2411745115 1138813722 1312614816
conv2d wgrad_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 2411745115 1138813722 4095449788
conv2d_with_broadcast fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 542905940 1152388039 4158385867 734550470
conv2d_with_broadcast fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 542905940 1152388039 4158385867 734550470
conv2d_with_broadcast fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1585175937 2411745115 3960856459 2498726848
conv2d_with_broadcast fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1585175937 2411745115 3960856459 2808936497
conv2d_with_broadcast fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2793112873 4021016722 3736889909 775549951
conv2d_with_broadcast fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2793112873 4021016722 3736889909 999245167
conv2d_with_broadcast fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3892602751 3987447721 1048231784 3578965759
conv2d_with_broadcast fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3892602751 3987447721 1048231784 3635477992
conv2d_with_broadcast fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1647798936 1986983586 2046300236 942258126
conv2d_with_broadcast fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1647798936 1986983586 2046300236 3024889990
conv2d_with_broadcast fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 3844983048 1063165266 1754355425
conv2d_with_broadcast fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 3844983048 1063165266 3524504078
conv2d_with_broadcast fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 741820436 4160104467 1904546220
conv2d_with_broadcast fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 741820436 4160104467 3380363267
conv2d_with_broadcast fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 2188679282 2508923337 202634559
conv2d_with_broadcast fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 2188679282 2508923337 129526502
conv2d_with_broadcast fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 1152388039 3960856459 687707885
conv2d_with_broadcast fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 1152388039 3960856459 687707885
conv2d_with_broadcast fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 4021016722 3960856459 551076377
conv2d_with_broadcast fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 4021016722 3960856459 2736700182
conv2d_with_broadcast fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3708184432 1152388039 3736889909 3070080445
conv2d_with_broadcast fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3708184432 1152388039 3736889909 3070080445
conv2d_with_broadcast fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3793481427 2784674253 206323080 4139449287
conv2d_with_broadcast fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3793481427 2784674253 206323080 37247821
conv2d_with_broadcast fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 724504571 866495443 4160104467 4166513007
conv2d_with_broadcast fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 724504571 866495443 4160104467 4147817279
conv2d_with_broadcast fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3696992523 2499748007 798339031 2425875414
conv2d_with_broadcast fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3696992523 2499748007 798339031 3318636886
conv2d_with_broadcast fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3999848747 2499748007 3897780943 1663875047
conv2d_with_broadcast fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3999848747 2499748007 3897780943 433625993
conv2d_with_broadcast fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1193090006 2131084833 1626339432 2602241257
conv2d_with_broadcast fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1193090006 2131084833 1626339432 2541313003
conv2d_with_broadcast fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3123356211 67170595 363851176 2694787359
conv2d_with_broadcast fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3123356211 67170595 363851176 2694787359
conv2d_with_broadcast fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 374093114 3867270480 3627748989 1042228997
conv2d_with_broadcast fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 374093114 3867270480 3627748989 2764787715
conv2d_with_broadcast fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3983093985 3903005020 2973635008 4245228167
conv2d_with_broadcast fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3983093985 3903005020 2973635008 2011478650
conv2d_with_broadcast fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3167361585 764195688 1462303962 1213873906
conv2d_with_broadcast fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3167361585 764195688 1462303962 3997555577
conv2d_with_broadcast fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2514717945 2683853778 864525589 2026195616
conv2d_with_broadcast fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2514717945 2683853778 864525589 1429180818
conv2d_with_broadcast fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1072544153 768805504 2851440397 1223626417
conv2d_with_broadcast fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1072544153 768805504 2851440397 4064809744
conv2d_with_broadcast fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3875284691 1195875134 1294114950 3478825820
conv2d_with_broadcast fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3875284691 1195875134 1294114950 2402092772
conv2d_with_broadcast fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3179965682 1961598694 1473372001 2976087551
conv2d_with_broadcast fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3179965682 1961598694 1473372001 2952357814
conv2d_with_broadcast fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2615784276 3832095556 3136842101 4100457990
conv2d_with_broadcast fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2615784276 3832095556 3136842101 4100457990
conv2d_with_broadcast fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 674692187 808380753 3300005124 3291766543
conv2d_with_broadcast fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 674692187 808380753 3300005124 932781825
conv2d_with_broadcast fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 2529610490 3633207144 2483933988
conv2d_with_broadcast fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 2529610490 3633207144 1649841999
conv2d_with_broadcast fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3562503578 4021646304 3183877059 640801373
conv2d_with_broadcast fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3562503578 4021646304 3183877059 1324440001
conv2d_with_broadcast fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1144321310 4021646304 79191055 2497200625
conv2d_with_broadcast fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1144321310 4021646304 79191055 4215716431
conv2d_with_broadcast fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3153402236 2244058322 751167457 2006726432
conv2d_with_broadcast fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3153402236 2244058322 751167457 111060226
conv2d_with_broadcast fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 803435641
conv2d_with_broadcast fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 1867934544
conv2d_with_broadcast fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 1900794023
conv2d_with_broadcast fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 3680542634
conv2d_with_broadcast fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4047780986 3796154296 1508665058 4120442081
conv2d_with_broadcast fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4047780986 3796154296 1508665058 2603142772
conv2d_with_broadcast fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4196208609 640419443 1000858800 1782212700
conv2d_with_broadcast fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4196208609 640419443 1000858800 3786504077
conv2d_with_broadcast fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1494714374 785253250 1035710906 607193837
conv2d_with_broadcast fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1494714374 785253250 1035710906 1133996987
conv2d_with_broadcast fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4104811786 417350231 2732854425 3257806996
conv2d_with_broadcast fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4104811786 417350231 2732854425 3964495721
conv2d_with_broadcast fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3747780903 2173099720 1359872451 260513555
conv2d_with_broadcast fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3747780903 2173099720 1359872451 959940766
conv2d_with_broadcast fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1007447386 3633207144 3338848009
conv2d_with_broadcast fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1007447386 3633207144 3338848009
conv2d_with_broadcast fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 7870409 1884736347 2440609834
conv2d_with_broadcast fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 7870409 1884736347 2440609834
conv2d_with_broadcast fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 2912193732 1884736347 616776505
conv2d_with_broadcast fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 2912193732 1884736347 2676398591
conv2d_with_broadcast fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 1007447386 1884736347 2365143548
conv2d_with_broadcast fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 1007447386 1884736347 2365143548
conv2d_with_broadcast fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3832095556 1694475665 593280269
conv2d_with_broadcast fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3832095556 1694475665 593280269
conv2d_with_broadcast fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3855174680 715002355 3155431044
conv2d_with_broadcast fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3855174680 715002355 3155431044
conv2d_with_broadcast fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 2822482016 715002355 2715024840
conv2d_with_broadcast fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 2822482016 715002355 1827980477
conv2d_with_broadcast fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 223404009 1694475665 1950498144
conv2d_with_broadcast fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 223404009 1694475665 1950498144
conv2d_with_broadcast fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 223404009 715002355 2992665436
conv2d_with_broadcast fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 223404009 715002355 2992665436
conv2d_with_broadcast fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 887849976 1884736347 737409599
conv2d_with_broadcast fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 887849976 1884736347 737409599
conv2d_with_broadcast fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 3832095556 1159201466 1807823289
conv2d_with_broadcast fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 3832095556 1159201466 1807823289
conv2d_with_broadcast fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 417350231 1159201466 2790858874
conv2d_with_broadcast fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 417350231 1159201466 1803950909
conv2d_with_broadcast fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 3796154296 1884736347 2211230337
conv2d_with_broadcast fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 3796154296 1884736347 2211230337
conv2d_with_broadcast fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 3796154296 1159201466 1707831674
conv2d_with_broadcast fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 3796154296 1159201466 1707831674
conv2d_with_broadcast fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1168268462 715002355 3410506082
conv2d_with_broadcast fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1168268462 715002355 3410506082
conv2d_with_broadcast fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 887849976 760086468 3430817166
conv2d_with_broadcast fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 887849976 760086468 3430817166
conv2d_with_broadcast fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 718873845 760086468 4057506865
conv2d_with_broadcast fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 718873845 760086468 1139160912
conv2d_with_broadcast fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 1971906017 715002355 3080563386
conv2d_with_broadcast fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 1971906017 715002355 3080563386
conv2d_with_broadcast fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 1971906017 760086468 1857427510
conv2d_with_broadcast fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 1971906017 760086468 1857427510
conv2d_with_broadcast fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2475183841 2416021807 2396614489 2728011042
conv2d_with_broadcast fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2475183841 2416021807 2396614489 48736270
conv2d_with_broadcast fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 835429033 3252222904 812624363 3532893716
conv2d_with_broadcast fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 835429033 3252222904 812624363 385208528
conv2d_with_broadcast fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_hnhwc_f_f 83915378 2330495260 877009950 1683572655
conv2d_with_reduction fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 542905940 1152388039 4158385867 734550470
conv2d_with_reduction fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 542905940 1152388039 4158385867 734550470
conv2d_with_reduction fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1585175937 2411745115 3960856459 2498726848
conv2d_with_reduction fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1585175937 2411745115 3960856459 2808936497
conv2d_with_reduction fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2793112873 4021016722 3736889909 775549951
conv2d_with_reduction fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2793112873 4021016722 3736889909 999245167
conv2d_with_reduction fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3892602751 3987447721 1048231784 3578965759
conv2d_with_reduction fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3892602751 3987447721 1048231784 3635477992
conv2d_with_reduction fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1647798936 1986983586 2046300236 942258126
conv2d_with_reduction fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1647798936 1986983586 2046300236 3024889990
conv2d_with_reduction fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 3844983048 1063165266 1754355425
conv2d_with_reduction fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 3844983048 1063165266 3524504078
conv2d_with_reduction fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 741820436 4160104467 1904546220
conv2d_with_reduction fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 741820436 4160104467 3380363267
conv2d_with_reduction fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 2188679282 2508923337 202634559
conv2d_with_reduction fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 664571366 2188679282 2508923337 129526502
conv2d_with_reduction fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 1152388039 3960856459 687707885
conv2d_with_reduction fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 1152388039 3960856459 687707885
conv2d_with_reduction fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 4021016722 3960856459 551076377
conv2d_with_reduction fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3376807219 4021016722 3960856459 2736700182
conv2d_with_reduction fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3708184432 1152388039 3736889909 3070080445
conv2d_with_reduction fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3708184432 1152388039 3736889909 3070080445
conv2d_with_reduction fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3793481427 2784674253 206323080 4139449287
conv2d_with_reduction fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3793481427 2784674253 206323080 37247821
conv2d_with_reduction fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 724504571 866495443 4160104467 4166513007
conv2d_with_reduction fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 724504571 866495443 4160104467 4147817279
conv2d_with_reduction fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3696992523 2499748007 798339031 2425875414
conv2d_with_reduction fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3696992523 2499748007 798339031 3318636886
conv2d_with_reduction fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3999848747 2499748007 3897780943 1663875047
conv2d_with_reduction fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3999848747 2499748007 3897780943 433625993
conv2d_with_reduction fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1193090006 2131084833 1626339432 2602241257
conv2d_with_reduction fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1193090006 2131084833 1626339432 2541313003
conv2d_with_reduction fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3123356211 67170595 363851176 2694787359
conv2d_with_reduction fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3123356211 67170595 363851176 2694787359
conv2d_with_reduction fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 374093114 3867270480 3627748989 1042228997
conv2d_with_reduction fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 374093114 3867270480 3627748989 2764787715
conv2d_with_reduction fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3983093985 3903005020 2973635008 4245228167
conv2d_with_reduction fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3983093985 3903005020 2973635008 2011478650
conv2d_with_reduction fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3167361585 764195688 1462303962 1213873906
conv2d_with_reduction fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3167361585 764195688 1462303962 3997555577
conv2d_with_reduction fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2514717945 2683853778 864525589 2026195616
conv2d_with_reduction fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2514717945 2683853778 864525589 1429180818
conv2d_with_reduction fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1072544153 768805504 2851440397 1223626417
conv2d_with_reduction fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1072544153 768805504 2851440397 4064809744
conv2d_with_reduction fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3875284691 1195875134 1294114950 3478825820
conv2d_with_reduction fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3875284691 1195875134 1294114950 2402092772
conv2d_with_reduction fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3179965682 1961598694 1473372001 2976087551
conv2d_with_reduction fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3179965682 1961598694 1473372001 2952357814
conv2d_with_reduction fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2615784276 3832095556 3136842101 4100457990
conv2d_with_reduction fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2615784276 3832095556 3136842101 4100457990
conv2d_with_reduction fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 674692187 808380753 3300005124 3291766543
conv2d_with_reduction fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 674692187 808380753 3300005124 932781825
conv2d_with_reduction fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 2529610490 3633207144 2483933988
conv2d_with_reduction fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 2529610490 3633207144 1649841999
conv2d_with_reduction fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3562503578 4021646304 3183877059 640801373
conv2d_with_reduction fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3562503578 4021646304 3183877059 1324440001
conv2d_with_reduction fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1144321310 4021646304 79191055 2497200625
conv2d_with_reduction fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1144321310 4021646304 79191055 4215716431
conv2d_with_reduction fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3153402236 2244058322 751167457 2006726432
conv2d_with_reduction fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3153402236 2244058322 751167457 111060226
conv2d_with_reduction fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 803435641
conv2d_with_reduction fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 1867934544
conv2d_with_reduction fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 1900794023
conv2d_with_reduction fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3356996599 4021646304 625876979 3680542634
conv2d_with_reduction fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4047780986 3796154296 1508665058 4120442081
conv2d_with_reduction fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4047780986 3796154296 1508665058 2603142772
conv2d_with_reduction fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4196208609 640419443 1000858800 1782212700
conv2d_with_reduction fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4196208609 640419443 1000858800 3786504077
conv2d_with_reduction fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1494714374 785253250 1035710906 607193837
conv2d_with_reduction fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1494714374 785253250 1035710906 1133996987
conv2d_with_reduction fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4104811786 417350231 2732854425 3257806996
conv2d_with_reduction fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4104811786 417350231 2732854425 3964495721
conv2d_with_reduction fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3747780903 2173099720 1359872451 260513555
conv2d_with_reduction fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3747780903 2173099720 1359872451 959940766
conv2d_with_reduction fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1007447386 3633207144 3338848009
conv2d_with_reduction fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1007447386 3633207144 3338848009
conv2d_with_reduction fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 7870409 1884736347 2440609834
conv2d_with_reduction fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 7870409 1884736347 2440609834
conv2d_with_reduction fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 2912193732 1884736347 616776505
conv2d_with_reduction fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 2912193732 1884736347 2676398591
conv2d_with_reduction fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 1007447386 1884736347 2365143548
conv2d_with_reduction fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 1007447386 1884736347 2365143548
conv2d_with_reduction fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3832095556 1694475665 593280269
conv2d_with_reduction fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3832095556 1694475665 593280269
conv2d_with_reduction fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3855174680 715002355 3155431044
conv2d_with_reduction fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 3557673531 3855174680 715002355 3155431044
conv2d_with_reduction fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 2822482016 715002355 2715024840
conv2d_with_reduction fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 2822482016 715002355 1827980477
conv2d_with_reduction fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 223404009 1694475665 1950498144
conv2d_with_reduction fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 223404009 1694475665 1950498144
conv2d_with_reduction fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 223404009 715002355 2992665436
conv2d_with_reduction fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 223404009 715002355 2992665436
conv2d_with_reduction fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 887849976 1884736347 737409599
conv2d_with_reduction fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 887849976 1884736347 737409599
conv2d_with_reduction fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 3832095556 1159201466 1807823289
conv2d_with_reduction fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 961566038 3832095556 1159201466 1807823289
conv2d_with_reduction fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 417350231 1159201466 2790858874
conv2d_with_reduction fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 417350231 1159201466 1803950909
conv2d_with_reduction fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 3796154296 1884736347 2211230337
conv2d_with_reduction fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2111106579 3796154296 1884736347 2211230337
conv2d_with_reduction fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 3796154296 1159201466 1707831674
conv2d_with_reduction fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 3796154296 1159201466 1707831674
conv2d_with_reduction fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1168268462 715002355 3410506082
conv2d_with_reduction fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 1168268462 715002355 3410506082
conv2d_with_reduction fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 887849976 760086468 3430817166
conv2d_with_reduction fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 1421336162 887849976 760086468 3430817166
conv2d_with_reduction fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 718873845 760086468 4057506865
conv2d_with_reduction fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 718873845 760086468 1139160912
conv2d_with_reduction fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 1971906017 715002355 3080563386
conv2d_with_reduction fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2237641409 1971906017 715002355 3080563386
conv2d_with_reduction fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 1971906017 760086468 1857427510
conv2d_with_reduction fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 4108139691 1971906017 760086468 1857427510
conv2d_with_reduction fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2475183841 2416021807 2396614489 2728011042
conv2d_with_reduction fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 2475183841 2416021807 2396614489 48736270
conv2d_with_reduction fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 835429033 3252222904 812624363 3532893716
conv2d_with_reduction fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_hnhwc_f_f 835429033 3252222904 812624363 385208528
conv2d_with_reduction fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_hnhwc_f_f 83915378 2330495260 877009950 1683572655
conv3d wgrad_1x1x3x3x8_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 260402488 3429884614 1585402383 833795101
conv3d wgrad_1x1x3x3x8_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 260402488 3429884614 1585402383 833795101
conv3d wgrad_1x1x1x8x8_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 3289763692 3767246007 1919973277 3027845106
conv3d wgrad_1x1x1x8x8_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 3289763692 3767246007 1919973277 3438501812
conv3d wgrad_1x8x8x8x8_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2160711118 237996982 3097125139 3385458653
conv3d wgrad_1x8x8x8x8_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2160711118 237996982 3097125139 4067030004
conv3d wgrad_1x16x16x16x8_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3097125139 2362430426
conv3d wgrad_1x16x16x16x8_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3097125139 232096215
conv3d wgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2925080861 1932218676 4010744414 1482409913
conv3d wgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2925080861 1932218676 4010744414 3679067567
conv3d wgrad_1x2x1x1x8_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2490670429 1753332435 375701898 2590121240
conv3d wgrad_1x2x1x1x8_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2490670429 1753332435 375701898 1128734185
conv3d wgrad_1x1x7x7x8_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2588182096 66500551 2381193183 2086127414
conv3d wgrad_1x1x7x7x8_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2588182096 66500551 2381193183 1043269053
conv3d wgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2938214523 2512139560 1761528323 1783334553
conv3d wgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2938214523 2512139560 1761528323 1179670460
conv3d wgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 2455664422 3608965793 765434198
conv3d wgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 2455664422 3608965793 188802405
conv3d wgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 790945652 2636428043 693887212
conv3d wgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 790945652 2636428043 384409630
conv3d wgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 790945652 843165254 3460165373
conv3d wgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 790945652 843165254 3773819495
conv3d wgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3823648244 533514635
conv3d wgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3823648244 1741504291
conv3d wgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 2117188192 2396130566 737907007
conv3d wgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 2117188192 2396130566 2545563286
conv3d wgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 1323666964 3626031696 399985743
conv3d wgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 1323666964 3626031696 2555400535
conv3d wgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 2017705694 3626031696 2729880203
conv3d wgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 2017705694 3626031696 2506274387
conv3d wgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2070552692 3823648244 244959174
conv3d wgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2070552692 3823648244 488179326
conv3d wgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2455664422 357908110 1536430798
conv3d wgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2455664422 357908110 943604539
conv3d wgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 790945652 4105258568 2484072263
conv3d wgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 790945652 4105258568 1264798027
conv3d wgrad_1x8x8x8x32_66x6_32x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha2_beta2 hndhwc_hndhwc_fndhwc_f_f 3757300649 1729998821 2636428043 857756936

View File

@ -0,0 +1,283 @@
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1152388039 486967919 3706990238
conv2d fprop_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1152388039 486967919 3706990238
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1585175937 2411745115 1919973277 506127908
conv2d fprop_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1585175937 2411745115 1919973277 2193864160
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 3872812830
conv2d fprop_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2445012180
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3892602751 3987447721 2963892063 3556328678
conv2d fprop_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3892602751 3987447721 2963892063 2088376980
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1647798936 1986983586 3862463878 498933688
conv2d fprop_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1647798936 1986983586 3862463878 2581533408
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 3844983048 373331791 3515334098
conv2d fprop_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 3844983048 373331791 2566159340
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 741820436 2695215306 4235633178
conv2d fprop_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 741820436 2695215306 815310604
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 2188679282 2132201986 1043483661
conv2d fprop_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 664571366 2188679282 2132201986 2172013863
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 1152388039 1919973277 1836150764
conv2d fprop_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 1152388039 1919973277 1836150764
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 4021016722 1919973277 3537245111
conv2d fprop_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3376807219 4021016722 1919973277 1166347001
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3708184432 1152388039 1911021900 4188669650
conv2d fprop_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3708184432 1152388039 1911021900 4188669650
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3793481427 2784674253 5067603 3709403009
conv2d fprop_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3793481427 2784674253 5067603 3666537740
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 724504571 866495443 2695215306 2273666993
conv2d fprop_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 724504571 866495443 2695215306 3277012289
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3696992523 2499748007 2381193183 4256475381
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3696992523 2499748007 2381193183 868016148
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3999848747 2499748007 1038140209 3720347250
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3999848747 2499748007 1038140209 3079806253
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1193090006 2131084833 720746870 1441382904
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1193090006 2131084833 720746870 2400159337
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3123356211 67170595 2290618404 1832291434
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3123356211 67170595 2290618404 1832291434
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 374093114 3867270480 2959096809 3957922181
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 374093114 3867270480 2959096809 855145836
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3983093985 3903005020 613201518 1067564721
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3983093985 3903005020 613201518 3116342099
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3167361585 764195688 167104692 3451521719
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3167361585 764195688 167104692 2267030515
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2514717945 2683853778 2557576548 3978291544
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2514717945 2683853778 2557576548 2608287914
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1072544153 768805504 1993107524 2984226313
conv2d fprop_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1072544153 768805504 1993107524 3008259681
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3875284691 1195875134 1041989393 1900995663
conv2d fprop_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3875284691 1195875134 1041989393 392783151
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3179965682 1961598694 1222599802 2151043714
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3179965682 1961598694 1222599802 1013916354
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2615784276 3832095556 1454859747 958765281
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2615784276 3832095556 1454859747 958765281
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 674692187 808380753 1933240382 879488563
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 674692187 808380753 1933240382 1399508988
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 961566038 2529610490 1966904362 1818870269
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 961566038 2529610490 1966904362 2484388308
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3562503578 4021646304 3426919182 4130346493
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3562503578 4021646304 3426919182 3486420438
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1144321310 4021646304 4185476157 964986272
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1144321310 4021646304 4185476157 1800819557
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3153402236 2244058322 623381239 4197612113
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3153402236 2244058322 623381239 2816226027
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 438913488
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 2812015344
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 307241203
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3356996599 4021646304 748585111 3413043496
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4047780986 3796154296 3933470176 2042558105
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4047780986 3796154296 3933470176 2082898655
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4196208609 640419443 3879567407 3126196765
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4196208609 640419443 3879567407 370340580
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1494714374 785253250 1954437668 16145912
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1494714374 785253250 1954437668 352471766
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4104811786 417350231 2268084635 3829320356
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4104811786 417350231 2268084635 3317921115
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3747780903 2173099720 1217977439 3831700802
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3747780903 2173099720 1217977439 2066501805
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2475183841 2416021807 90427526 3879607464
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2475183841 2416021807 90427526 3914420497
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 835429033 3252222904 934864596 2610068735
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 835429033 3252222904 934864596 4160630405
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 83915378 2330495260 722450442 220865236
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 1152388039 1036082506 2004021933
conv2d dgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 1152388039 1036082506 2004021933
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 2411745115 1585402383 692064357
conv2d dgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 2411745115 1585402383 3191762167
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2493803192
conv2d dgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 4021016722 1911021900 2915688271
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3987447721 311726682 356690874
conv2d dgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3987447721 311726682 3600277581
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 1986983586 1898068767 1480022038
conv2d dgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 1986983586 1898068767 1482170634
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 3844983048 3628298618 1684782062
conv2d dgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 3844983048 3628298618 1312771437
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 741820436 3628298618 3927854537
conv2d dgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 741820436 3628298618 3753859236
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 2188679282 3628298618 331956491
conv2d dgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 2188679282 3628298618 3514953364
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 67170595 1307969125 1500995359
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 67170595 1307969125 1500995359
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 3903005020 1541598000 4224357357
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 3903005020 1541598000 1962390570
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 764195688 2813830197 3377586111
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 764195688 2813830197 1315372741
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 2683853778 2983167436 324191835
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 2683853778 2983167436 1085373547
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 768805504 3823519277 1916712483
conv2d dgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 768805504 3823519277 1584393587
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 1195875134 2636428043 1173364286
conv2d dgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 1195875134 2636428043 4109782860
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 785253250 2351024902 3316943078
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 785253250 2351024902 1065622134
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 417350231 2574042419 294608043
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 417350231 2574042419 491435109
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 2173099720 3438778114 3788164138
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 2173099720 3438778114 2104210385
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 2416021807 2145192778 2640510765
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 2416021807 2145192778 2748647248
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3252222904 535024815 169162784
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3252222904 535024815 3841086721
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 2329920945 2330495260 1682007569 215965178
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 3282100285 1585402383 820104967
conv2d wgrad_1x1x1x8_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 558763846 3282100285 1585402383 820104967
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 1919973277 4103626856
conv2d wgrad_1x1x8x8_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 1919973277 4164492975
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 2527774459 2695215306 1519678771
conv2d wgrad_1x7x8x8_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 2527774459 2695215306 4056436284
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3488761154 1737428004 2359527095
conv2d wgrad_1x7x9x8_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 390767101 3488761154 1737428004 2240340004
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 2242491745 475190714 3363555017
conv2d wgrad_2x7x9x8_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2346452629 2242491745 475190714 2240937477
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 1231166805 3030543492 1587793687
conv2d wgrad_3x7x9x8_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 695385844 1231166805 3030543492 4129044530
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 1231166805 3002932066 1436246794
conv2d wgrad_3x7x9x8_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 1231166805 3002932066 2860692730
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 1231166805 2704246666 3831504826
conv2d wgrad_3x7x9x8_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2078642274 1231166805 2704246666 932276705
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 1585402383 584217576
conv2d wgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 1585402383 584217576
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 2695215306 644274899
conv2d wgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 3952246738 2695215306 2070383610
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 3269716347 1585402383 2091838742
conv2d wgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 3269716347 1585402383 2091838742
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2208297031 3036494114 1391639360
conv2d wgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2208297031 3036494114 2853291206
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 3638907161 2381193183 4076043307
conv2d wgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 3638907161 2381193183 162466399
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 1748311260 3097125139 1760368998
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 1748311260 3097125139 370487040
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 950177617 3097125139 2441672462
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 950177617 3097125139 4093130692
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 3223936144 3268227320 3407045986
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 3223936144 3268227320 3327506975
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 2413111238 4020828414 3782469663
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1371340519 2413111238 4020828414 3782469663
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 1849062825 2621782130 1997835815
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 1849062825 2621782130 2176605786
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 1028019427 3062073018 1532225578
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2815270590 1028019427 3062073018 3175924537
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 665408258 4119019906 3070068838
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2371881721 665408258 4119019906 4095170522
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 1329921014 2730633195 1859011130
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2314925659 1329921014 2730633195 1829382848
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 654394569 180842421 456267566
conv2d wgrad_1x15x19x40_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1327011661 654394569 180842421 4065629708
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 792561864 3949436648 2346117136
conv2d wgrad_1x16x24x72_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2223985070 792561864 3949436648 3375703263
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 2182213461 3596813277 2680766255
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 2182213461 3596813277 819444109
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 4284293314 3730143675 2330242371
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 4284293314 3730143675 2330242371
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 1488124595 3162712336 2186928678
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 1488124595 3162712336 4038147074
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 1324698024 1813717058 1491574211
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 1324698024 1813717058 664642450
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 1617738198 2081693980 1691976762
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 1617738198 2081693980 1352928468
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 169231440 2081693980 4154079864
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 169231440 2081693980 49240552
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 1111691860 1000406280 1708014479
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 1111691860 1000406280 2976393539
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 141423768
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 1807012226
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 4065587708
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 3782006390 2081693980 3621154478
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 4018387624 2099843274 3166971951
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 4018387624 2099843274 710495809
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 1007447386 3357056235 3446932548
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 1007447386 3357056235 344178277
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 4040055257 852881505 1633246355
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2519843766 4040055257 852881505 778858244
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 428926092 1217669626 1090782686
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4232110637 428926092 1217669626 1523455590
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 1787889194 2989357662 3134613422
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3630316758 1787889194 2989357662 1158845444
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 857847029 3333097025 3239572160
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 866609547 857847029 3333097025 2436320376
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3294874067 3443985888 4083335585
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2538496988 3294874067 3443985888 3302917564
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 2329920945 531242570 422976060 2227466455
conv2d wgrad_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 2411745115 1138813722 1312614816
conv2d wgrad_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 2411745115 1138813722 4095449788
conv2d dgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 2564029204 3847371704
conv2d dgrad_1x11x7x8_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 1152388039 2564029204 3847371704
conv2d dgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 4021016722 2564029204 2275490218
conv2d dgrad_1x11x7x8_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2125023038 4021016722 2564029204 2132854116
conv2d dgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 1152388039 1676221042 3084298807
conv2d dgrad_1x13x11x8_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2793112873 1152388039 1676221042 3084298807
conv2d dgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2784674253 191365871 3758840577
conv2d dgrad_1x17x19x8_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 624119942 2784674253 191365871 201424948
conv2d dgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 866495443 4038686961 1705939247
conv2d dgrad_1x23x5x8_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 118714643 866495443 4038686961 2657530738
conv2d dgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 2499748007 688732356 3362895769
conv2d dgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3912955093 2499748007 688732356 4133050271
conv2d dgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 2499748007 3810393490 1868454698
conv2d dgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2380180646 2499748007 3810393490 4121127243
conv2d dgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 2131084833 2598385656 2382857802
conv2d dgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4197955097 2131084833 2598385656 3397661960
conv2d dgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 3867270480 2925287275 2208597029
conv2d dgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 4064585156 3867270480 2925287275 2274812992
conv2d dgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 1961598694 1379168514 1077915308
conv2d dgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1663038387 1961598694 1379168514 397243715
conv2d dgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 3832095556 2917865891 4107392040
conv2d dgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2518156720 3832095556 2917865891 4107392040
conv2d dgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 808380753 3243383160 254649230
conv2d dgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1153452126 808380753 3243383160 1326012988
conv2d dgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 2529610490 78092922 937037280
conv2d dgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3557673531 2529610490 78092922 1858025388
conv2d dgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 4021646304 2515450069 981269351
conv2d dgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3373735934 4021646304 2515450069 1054201594
conv2d dgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 4021646304 2499255921 2519894620
conv2d dgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 1883441731 4021646304 2499255921 779628000
conv2d dgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 2244058322 2208482181 1483418711
conv2d dgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2212544074 2244058322 2208482181 4167030585
conv2d dgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 4021646304 3459396734 456980924
conv2d dgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 4021646304 3459396734 2013696151
conv2d dgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 4021646304 3459396734 3583381428
conv2d dgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 841696772 4021646304 3459396734 3556307685
conv2d dgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 3796154296 4084859749 2972648305
conv2d dgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3869576724 3796154296 4084859749 2483086888
conv2d dgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 640419443 843165254 729442897
conv2d dgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 2106265431 640419443 843165254 1567894631
conv2d dgrad_1x56x56x8_28x28_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha2_beta2 hnhwc_hnhwc_fnhwc_f_f 3092573237 1152388039 1813717058 3398247359
conv2d dgrad_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1189071464 1919973277 257167289
conv2d dgrad_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 542905940 1189071464 1919973277 419044577
conv2d dgrad_1x56x56x12_28x28_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3092573237 1046014840 3129171903 3024531293
conv2d dgrad_1x56x56x12_28x28_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3092573237 1046014840 3129171903 3024531293
conv2d dgrad_1x55x55x12_28x28_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3092573237 1046014840 1050854832 1177039304
conv2d dgrad_1x55x55x12_28x28_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 hnhwc_hnhwc_fnhwc_f_f 3092573237 1046014840 1050854832 1177039304
conv3d wgrad_1x1x3x3x8_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 260402488 3429884614 1585402383 833795101
conv3d wgrad_1x1x3x3x8_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 260402488 3429884614 1585402383 833795101
conv3d wgrad_1x1x1x8x8_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 3289763692 3767246007 1919973277 3027845106
conv3d wgrad_1x1x1x8x8_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 3289763692 3767246007 1919973277 3438501812
conv3d wgrad_1x8x8x8x8_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2160711118 237996982 3097125139 3385458653
conv3d wgrad_1x8x8x8x8_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2160711118 237996982 3097125139 4067030004
conv3d wgrad_1x16x16x16x8_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3097125139 2362430426
conv3d wgrad_1x16x16x16x8_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3097125139 232096215
conv3d wgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2925080861 1932218676 4010744414 1482409913
conv3d wgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2925080861 1932218676 4010744414 3679067567
conv3d wgrad_1x2x1x1x8_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2490670429 1753332435 375701898 2590121240
conv3d wgrad_1x2x1x1x8_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2490670429 1753332435 375701898 1128734185
conv3d wgrad_1x1x7x7x8_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2588182096 66500551 2381193183 2086127414
conv3d wgrad_1x1x7x7x8_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2588182096 66500551 2381193183 1043269053
conv3d wgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2938214523 2512139560 1761528323 1783334553
conv3d wgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 2938214523 2512139560 1761528323 1179670460
conv3d wgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 2455664422 3608965793 765434198
conv3d wgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 2455664422 3608965793 188802405
conv3d wgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 790945652 2636428043 693887212
conv3d wgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 795080053 790945652 2636428043 384409630
conv3d wgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 790945652 843165254 3460165373
conv3d wgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 790945652 843165254 3773819495
conv3d wgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3823648244 533514635
conv3d wgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 4101517777 2117188192 3823648244 1741504291
conv3d wgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 2117188192 2396130566 737907007
conv3d wgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 2117188192 2396130566 2545563286
conv3d wgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 1323666964 3626031696 399985743
conv3d wgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1247243134 1323666964 3626031696 2555400535
conv3d wgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 2017705694 3626031696 2729880203
conv3d wgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 2017705694 3626031696 2506274387
conv3d wgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2070552692 3823648244 244959174
conv3d wgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2070552692 3823648244 488179326
conv3d wgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2455664422 357908110 1536430798
conv3d wgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 1092746437 2455664422 357908110 943604539
conv3d wgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 790945652 4105258568 2484072263
conv3d wgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 hndhwc_hndhwc_fndhwc_f_f 796662877 790945652 4105258568 1264798027
conv3d wgrad_1x8x8x8x32_66x6_32x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha2_beta2 hndhwc_hndhwc_fndhwc_f_f 3757300649 1729998821 2636428043 857756936

View File

@ -0,0 +1,310 @@
conv2d fprop_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3717255578 1782345730 486967919 3628559084
conv2d fprop_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3717255578 1782345730 486967919 3628559084
conv2d fprop_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1438136294 118775326 1919973277 3060288390
conv2d fprop_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1438136294 118775326 1919973277 2970039207
conv2d fprop_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2098961808 3028917290 1911021900 2231724975
conv2d fprop_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2098961808 3028917290 1911021900 32368867
conv2d fprop_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2965017607 403875147 2963892063 3617758931
conv2d fprop_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2965017607 403875147 2963892063 1213867461
conv2d fprop_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 667266590 2406505019 3862463878 1032157693
conv2d fprop_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 667266590 2406505019 3862463878 2512484574
conv2d fprop_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2475006452 3635815590 373331791 156090483
conv2d fprop_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2475006452 3635815590 373331791 2125643627
conv2d fprop_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2475006452 511925094 2695215306 1183833128
conv2d fprop_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2475006452 511925094 2695215306 950863078
conv2d fprop_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2475006452 2496949223 2132201986 1645211922
conv2d fprop_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2475006452 2496949223 2132201986 888922489
conv2d fprop_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 997827848 1782345730 1919973277 3242947060
conv2d fprop_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 997827848 1782345730 1919973277 3242947060
conv2d fprop_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 997827848 3028917290 1919973277 2570877648
conv2d fprop_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 997827848 3028917290 1919973277 3601912269
conv2d fprop_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2114904520 1782345730 1911021900 1777629475
conv2d fprop_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2114904520 1782345730 1911021900 1777629475
conv2d fprop_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2323582907 3813900300 5067603 2056042422
conv2d fprop_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2323582907 3813900300 5067603 3581028648
conv2d fprop_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2541524845 3272268888 2695215306 1284148249
conv2d fprop_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2541524845 3272268888 2695215306 529645467
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 185683981 2918738410 2381193183 3146807750
conv2d fprop_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 185683981 2918738410 2381193183 3919362272
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 588375524 2918738410 1038140209 2259020777
conv2d fprop_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 588375524 2918738410 1038140209 2073872618
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 637528927 1554396804 720746870 2382111738
conv2d fprop_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 637528927 1554396804 720746870 1697335701
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 867397053 1472739692 2290618404 3626933660
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 867397053 1472739692 2290618404 3626933660
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3560734409 796697554 2959096809 3337392869
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3560734409 796697554 2959096809 1465273757
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 613937219 2493469875 613201518 2545095524
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 613937219 2493469875 613201518 119102005
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3361618670 3613518632 167104692 2075508652
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3361618670 3613518632 167104692 249956416
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2077916351 2183908250 2557576548 825424571
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2077916351 2183908250 2557576548 3723250582
conv2d fprop_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3337465330 687027832 1993107524 3917445532
conv2d fprop_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3337465330 687027832 1993107524 723144309
conv2d fprop_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2259030042 474618004 1041989393 4007092054
conv2d fprop_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2259030042 474618004 1041989393 121750431
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 698239287 1381476450 1222599802 2705358355
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 698239287 1381476450 1222599802 1921082534
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3178095839 69226238 1454859747 2429064071
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3178095839 69226238 1454859747 2429064071
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1986322298 2695937708 1933240382 258792262
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1986322298 2695937708 1933240382 1350961289
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3975148258 1880796449 1966904362 2674132654
conv2d fprop_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3975148258 1880796449 1966904362 4061823028
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 864161797 2648936894 3426919182 1513280885
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 864161797 2648936894 3426919182 3304279324
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3665852514 2648936894 4185476157 1062588307
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3665852514 2648936894 4185476157 1737400068
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1720566144 613651087 623381239 3456180201
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1720566144 613651087 623381239 612510019
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3148446926 2648936894 748585111 1918078890
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3148446926 2648936894 748585111 1296506717
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3148446926 2648936894 748585111 720321141
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3148446926 2648936894 748585111 2250020808
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3133916250 3595579175 3933470176 1216324411
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3133916250 3595579175 3933470176 1337638334
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 647896480 614033835 3879567407 2187352956
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 647896480 614033835 3879567407 3505172898
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1692261965 2681206785 1954437668 3275330607
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1692261965 2681206785 1954437668 3211342413
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 5417052 782710099 2268084635 2574304052
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 5417052 782710099 2268084635 959147198
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 81064849 3635880243 1217977439 1759317211
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 81064849 3635880243 1217977439 3077847987
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1369732128 3852936634 90427526 1404446496
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1369732128 3852936634 90427526 4261451781
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1636922998 3114239439 934864596 1375658938
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1636922998 3114239439 934864596 90410819
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 tf32nhwc_tf32nhwc_fnhwc_f_f 2874774314 3318673787 722450442 726679987
conv2d fprop_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 3518807763 1036082506 3048105666
conv2d fprop_1x4x4x12_1x1_8x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 3518807763 1036082506 3968624793
conv2d dgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1544571845 1782345730 3890556343 3840696830
conv2d dgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1544571845 1782345730 3890556343 3840696830
conv2d dgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 118775326 2980124304 2572054323
conv2d dgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 118775326 2980124304 4006425566
conv2d dgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3304381737 3028917290 802623080 1655787066
conv2d dgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3304381737 3028917290 802623080 2956350850
conv2d dgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2123037179 403875147 2738672641 962312341
conv2d dgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2123037179 403875147 2738672641 3126435132
conv2d dgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2220887882 2406505019 311726682 4061102478
conv2d dgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2220887882 2406505019 311726682 2314369199
conv2d dgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3209955145 3635815590 1146816700 3996872848
conv2d dgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3209955145 3635815590 1146816700 2269688958
conv2d dgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3007342694 511925094 1146816700 1719436727
conv2d dgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3007342694 511925094 1146816700 4236972782
conv2d dgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3553706784 2496949223 1146816700 1307853167
conv2d dgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3553706784 2496949223 1146816700 469937848
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1430474811 1472739692 1307969125 2041137857
conv2d dgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1430474811 1472739692 1307969125 2041137857
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1394549732 2493469875 1541598000 562462849
conv2d dgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1394549732 2493469875 1541598000 585918261
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 136395274 3613518632 2813830197 3551637995
conv2d dgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 136395274 3613518632 2813830197 2284323213
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 176279613 2183908250 2983167436 866644788
conv2d dgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 176279613 2183908250 2983167436 253066315
conv2d dgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 4065225089 687027832 1092494080 274183605
conv2d dgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 4065225089 687027832 1092494080 1241514327
conv2d dgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3973136713 474618004 3541920582 2018009151
conv2d dgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3973136713 474618004 3541920582 1303918704
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3059307623 2681206785 2351024902 941952011
conv2d dgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3059307623 2681206785 2351024902 3577527602
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1541852759 782710099 2574042419 2518679986
conv2d dgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1541852759 782710099 2574042419 3797768014
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 310867128 3635880243 3438778114 508409341
conv2d dgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 310867128 3635880243 3438778114 3918768286
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1053420568 3852936634 2145192778 3649177283
conv2d dgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1053420568 3852936634 2145192778 2392118609
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 822175023 3114239439 535024815 4039199216
conv2d dgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 822175023 3114239439 535024815 2891577765
conv2d dgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 tf32nhwc_tf32nhwc_fnhwc_f_f 1919899681 3318673787 1682007569 2212069629
conv2d wgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1544571845 2859715967 2980124304 2169312899
conv2d wgrad_1x1x1x4_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1544571845 2859715967 2980124304 2169312899
conv2d wgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 1782345730 294738383 1067638259
conv2d wgrad_1x1x8x4_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 1782345730 294738383 504959928
conv2d wgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3304381737 4201241820 1588130777 587511439
conv2d wgrad_1x7x8x4_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3304381737 4201241820 1588130777 3767308084
conv2d wgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2123037179 442597470 3036494114 4124366680
conv2d wgrad_1x7x9x4_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2123037179 442597470 3036494114 2833785422
conv2d wgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2220887882 347064917 1239438433 1775116239
conv2d wgrad_2x7x9x4_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2220887882 347064917 1239438433 1288542483
conv2d wgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3209955145 3544266385 4207987780 4054255409
conv2d wgrad_3x7x9x4_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3209955145 3544266385 4207987780 180834054
conv2d wgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3007342694 3544266385 2381193183 353843599
conv2d wgrad_3x7x9x4_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3007342694 3544266385 2381193183 1860329513
conv2d wgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3553706784 3544266385 2224388272 347055977
conv2d wgrad_3x7x9x4_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3553706784 3544266385 2224388272 994788649
conv2d wgrad_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 4212246537 2980124304 1448608264
conv2d wgrad_1x11x7x4_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 4212246537 2980124304 1448608264
conv2d wgrad_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 4212246537 1588130777 2381531672
conv2d wgrad_1x11x7x4_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 8625275 4212246537 1588130777 3417974847
conv2d wgrad_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3304381737 1617004893 2980124304 2512582600
conv2d wgrad_1x13x11x4_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3304381737 1617004893 2980124304 2512582600
conv2d wgrad_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1244986212 3239036557 3840288384 2880620663
conv2d wgrad_1x17x19x4_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1244986212 3239036557 3840288384 2552969500
conv2d wgrad_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3007342694 292469256 2695215306 3059274099
conv2d wgrad_1x23x5x4_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3007342694 292469256 2695215306 3436607346
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3748734767 1457012710 3097125139 3643918743
conv2d wgrad_1x13x17x8_6x8_24x3x3_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3748734767 1457012710 3097125139 747082267
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2635354436 2208465189 3097125139 21340657
conv2d wgrad_1x23x21x8_8x7_24x3x3_pad_h1w1_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2635354436 2208465189 3097125139 56227083
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2145197840 1160827838 3268227320 2781787969
conv2d wgrad_1x20x24x8_8x10_40x3x3_pad_h3w3_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2145197840 1160827838 3268227320 4054149767
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1430474811 1631191071 4020828414 692686929
conv2d wgrad_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1430474811 1631191071 4020828414 692686929
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3718005369 1445988057 2621782130 2833949486
conv2d wgrad_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3718005369 1445988057 2621782130 3251496823
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1394549732 268042026 3062073018 220836046
conv2d wgrad_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1394549732 268042026 3062073018 1707620502
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 136395274 3160856554 4119019906 338363935
conv2d wgrad_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 136395274 3160856554 4119019906 738717986
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 176279613 3166512658 2730633195 4275642741
conv2d wgrad_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 176279613 3166512658 2730633195 3105473059
conv2d wgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 4065225089 743025951 2871183684 1457368860
conv2d wgrad_1x15x19x36_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 4065225089 743025951 2871183684 2129608645
conv2d wgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3973136713 3690950270 995921099 1290832901
conv2d wgrad_1x16x24x68_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3973136713 3690950270 995921099 154477589
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 453168706 2270954829 3596813277 3377048584
conv2d wgrad_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 453168706 2270954829 3596813277 412509722
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2806952902 2924638290 3730143675 2712417789
conv2d wgrad_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2806952902 2924638290 3730143675 2712417789
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3121139790 3364591286 3162712336 2691220362
conv2d wgrad_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3121139790 3364591286 3162712336 3441232209
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2888814356 1897929139 1813717058 3953491679
conv2d wgrad_1x224x224x8_112x112_64x7x7_pad_h3w3_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2888814356 1897929139 1813717058 1261891081
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 610508213 451878551 2081693980 3439473075
conv2d wgrad_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 610508213 451878551 2081693980 3352279175
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 348294340 312331117 2081693980 3359165930
conv2d wgrad_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 348294340 312331117 2081693980 1942009480
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 718804073 2164859727 1000406280 332157749
conv2d wgrad_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 718804073 2164859727 1000406280 2601063004
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2287428715 1869820720 2081693980 4100031453
conv2d wgrad_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2287428715 1869820720 2081693980 1919107176
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2287428715 1869820720 2081693980 1618717912
conv2d wgrad_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2287428715 1869820720 2081693980 221251170
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 579355209 3754887563 2099843274 1752033731
conv2d wgrad_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 579355209 3754887563 2099843274 2254410747
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2276312507 1260894714 3357056235 4220059751
conv2d wgrad_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 2276312507 1260894714 3357056235 3334646036
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3059307623 562108865 852881505 1729883415
conv2d wgrad_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 3059307623 562108865 852881505 3112064590
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1541852759 341839800 1217669626 2313445327
conv2d wgrad_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1541852759 341839800 1217669626 2378687243
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 310867128 2038652539 2989357662 2523233417
conv2d wgrad_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 310867128 2038652539 2989357662 845687444
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1053420568 2110244091 3333097025 2967627788
conv2d wgrad_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 1053420568 2110244091 3333097025 285381561
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 822175023 71186875 3443985888 4252958697
conv2d wgrad_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 tf32nhwc_tf32nhwc_fnhwc_f_f 822175023 71186875 3443985888 160172027
conv2d wgrad_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 tf32nhwc_tf32nhwc_fnhwc_f_f 1919899681 1064146348 422976060 2522704893
conv3d fprop_1x1x3x3x4_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2319502486 1782345730 486967919 4136734195
conv3d fprop_1x1x3x3x4_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2319502486 1782345730 486967919 4136734195
conv3d fprop_1x1x1x8x4_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1438136294 118775326 2695215306 2927015709
conv3d fprop_1x1x1x8x4_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1438136294 118775326 2695215306 4170943443
conv3d fprop_1x8x8x8x4_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 407326717 3518807763 3608965793 698355669
conv3d fprop_1x8x8x8x4_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 407326717 3518807763 3608965793 5045356
conv3d fprop_1x16x16x16x4_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 647896480 3518807763 4105258568 4103291466
conv3d fprop_1x16x16x16x4_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 647896480 3518807763 4105258568 4029231659
conv3d fprop_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 867397053 1428724777 2090640390 1215385964
conv3d fprop_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 867397053 1428724777 2090640390 498496015
conv3d fprop_1x2x1x1x4_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 238174184 1674520437 1036082506 887717017
conv3d fprop_1x2x1x1x4_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 238174184 1674520437 1036082506 587915145
conv3d fprop_1x1x7x7x4_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3889952025 3272268888 898368197 4271884702
conv3d fprop_1x1x7x7x4_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3889952025 3272268888 898368197 3556157853
conv3d fprop_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3187517693 3677644254 281930990 1021147836
conv3d fprop_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3187517693 3677644254 281930990 3524380466
conv3d fprop_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2247510726 2370687016 3730143675 1238812141
conv3d fprop_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2247510726 2370687016 3730143675 2970038618
conv3d fprop_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 4122056936 3730143675 1023049729
conv3d fprop_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 4122056936 3730143675 109265270
conv3d fprop_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 1260894714 4105258568 1321339181
conv3d fprop_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 1260894714 4105258568 1115472017
conv3d fprop_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 3794173544 4105258568 3595166297
conv3d fprop_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 3794173544 4105258568 4158879376
conv3d fprop_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 1811285868 357908110 1351907827
conv3d fprop_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 1811285868 357908110 2935470866
conv3d fprop_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 3798825666 357908110 857966805
conv3d fprop_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 3798825666 357908110 3012212889
conv3d fprop_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 3798825666 2396130566 1514562293
conv3d fprop_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 3798825666 2396130566 186849532
conv3d fprop_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3794173544 2099843274 28708521
conv3d fprop_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3794173544 2099843274 1423759885
conv3d fprop_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2247510726 1297934566 2099843274 4045723120
conv3d fprop_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2247510726 1297934566 2099843274 3875049477
conv3d fprop_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 2962142380 2396130566 2601052002
conv3d fprop_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 2962142380 2396130566 2310738198
conv3d fprop_1x8x8x8x32_66x6_32x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha2_beta2 tf32ndhwc_tf32ndhwc_fndhwc_f_f 647896480 4122056936 925123690 251219599
conv3d dgrad_1x1x3x3x4_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1544571845 1782345730 2631899086 4172520459
conv3d dgrad_1x1x3x3x4_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1544571845 1782345730 2631899086 4172520459
conv3d dgrad_1x1x1x8x4_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3007342694 118775326 2980124304 2325666174
conv3d dgrad_1x1x1x8x4_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3007342694 118775326 2980124304 3237412583
conv3d dgrad_1x8x8x8x4_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 838246671 3518807763 852881505 655607058
conv3d dgrad_1x8x8x8x4_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 838246671 3518807763 852881505 2254239777
conv3d dgrad_1x16x16x16x4_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 3518807763 843165254 3325209335
conv3d dgrad_1x16x16x16x4_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 3518807763 843165254 2627823804
conv3d dgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1644441141 1428724777 1307969125 2400954527
conv3d dgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1644441141 1428724777 1307969125 3666407510
conv3d dgrad_1x2x1x1x4_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 238174184 1674520437 1036082506 2949975932
conv3d dgrad_1x2x1x1x4_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 238174184 1674520437 1036082506 1943004100
conv3d dgrad_1x1x7x7x4_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3595246799 3272268888 4235871427 2941526336
conv3d dgrad_1x1x7x7x4_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3595246799 3272268888 4235871427 2946859880
conv3d dgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4058682611 3677644254 1887901192 1540875533
conv3d dgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4058682611 3677644254 1887901192 2224057566
conv3d dgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 2370687016 3843555714 936632720
conv3d dgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 2370687016 3843555714 2508620825
conv3d dgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 4122056936 3730143675 1092073219
conv3d dgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 4122056936 3730143675 1665031504
conv3d dgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 1260894714 3730143675 3800549697
conv3d dgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 1260894714 3730143675 138980222
conv3d dgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 3794173544 4105258568 2796017159
conv3d dgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 3794173544 4105258568 3061070136
conv3d dgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 1811285868 4105258568 3835960274
conv3d dgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 1811285868 4105258568 1306995538
conv3d dgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 3798825666 357908110 3705914599
conv3d dgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 3798825666 357908110 4247587642
conv3d dgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 3798825666 2396130566 4140791836
conv3d dgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 3798825666 2396130566 3667453924
conv3d dgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3794173544 2099843274 1201571258
conv3d dgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3794173544 2099843274 2360671465
conv3d dgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 1297934566 3843555714 2551458848
conv3d dgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 1297934566 3843555714 2147657107
conv3d dgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 2962142380 3730143675 2771085644
conv3d dgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 2962142380 3730143675 3242056610
conv3d dgrad_1x8x8x8x32_66x6_32x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha2_beta2 tf32ndhwc_tf32ndhwc_fndhwc_f_f 230909806 4122056936 843165254 1420345119
conv3d wgrad_1x1x3x3x4_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1544571845 1854804847 2980124304 2713669702
conv3d wgrad_1x1x3x3x4_13x3_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1544571845 1854804847 2980124304 2713669702
conv3d wgrad_1x1x1x8x4_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3007342694 1782345730 294738383 3475727547
conv3d wgrad_1x1x1x8x4_33x8_8x1x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3007342694 1782345730 294738383 947267570
conv3d wgrad_1x8x8x8x4_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 838246671 2681206785 1138813722 824075861
conv3d wgrad_1x8x8x8x4_88x8_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 838246671 2681206785 1138813722 82060253
conv3d wgrad_1x16x16x16x4_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 1260894714 1138813722 3511262600
conv3d wgrad_1x16x16x16x4_1616x16_8x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 1260894714 1138813722 4001643207
conv3d wgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1644441141 1631191071 4010744414 942007202
conv3d wgrad_1x1x15x19x160_113x14_224x3x6_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1644441141 1631191071 4010744414 4225324524
conv3d wgrad_1x2x1x1x4_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 238174184 2768167245 1585402383 4211777251
conv3d wgrad_1x2x1x1x4_11x1_8x1x1_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 238174184 2768167245 1585402383 3750079405
conv3d wgrad_1x1x7x7x4_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3595246799 1159024946 2695215306 4166286345
conv3d wgrad_1x1x7x7x4_15x5_16x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 3595246799 1159024946 2695215306 614099477
conv3d wgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4058682611 2837532843 1761528323 549885623
conv3d wgrad_1x11x15x19x64_1215x20_32x3x6_pad_d1h1w3_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4058682611 2837532843 1761528323 2965474394
conv3d wgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 3423607562 3608965793 2798805760
conv3d wgrad_1x32x32x32x16_1616x16_32x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 3423607562 3608965793 1941621355
conv3d wgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 69226238 2636428043 2649061923
conv3d wgrad_1x16x16x16x32_1616x16_32x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1193322564 69226238 2636428043 3901259858
conv3d wgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 69226238 843165254 902125153
conv3d wgrad_1x16x16x16x32_88x8_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 69226238 843165254 2897689664
conv3d wgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 2962142380 3823648244 1458256611
conv3d wgrad_1x8x8x8x64_88x8_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 4051538848 2962142380 3823648244 479658980
conv3d wgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 2962142380 2396130566 1553657582
conv3d wgrad_1x8x8x8x64_44x4_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 2962142380 2396130566 1843818935
conv3d wgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 1297934566 3626031696 3309140977
conv3d wgrad_1x4x4x4x128_44x4_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2177662229 1297934566 3626031696 3877168474
conv3d wgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 1811285868 3626031696 2959655816
conv3d wgrad_1x8x8x8x128_88x8_128x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 1811285868 3626031696 2478179322
conv3d wgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3595579175 3823648244 1409929324
conv3d wgrad_1x16x16x16x64_1616x16_64x3x3_pad_d1h1w1_stride_d1h1w1_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3595579175 3823648244 3283749403
conv3d wgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3423607562 357908110 3763482552
conv3d wgrad_1x32x32x32x16_1616x16_64x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 2614793891 3423607562 357908110 984484147
conv3d wgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_corr_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 69226238 4105258568 3342929921
conv3d wgrad_1x16x16x16x32_88x8_128x2x2_pad_d0h0w0_stride_d2h2w2_dil_d1h1w1_conv_alpha1_beta0 tf32ndhwc_tf32ndhwc_fndhwc_f_f 1329805353 69226238 4105258568 893600736
conv3d wgrad_1x8x8x8x32_66x6_32x3x3_pad_d0h0w0_stride_d1h1w1_dil_d1h1w1_corr_alpha2_beta2 tf32ndhwc_tf32ndhwc_fndhwc_f_f 230909806 1260894714 2636428043 2198733997

View File

@ -0,0 +1,138 @@
conv2d fprop_1x1x1x16_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 776637956 2909557486 4209557191 2628681889
conv2d fprop_1x1x1x16_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 776637956 2909557486 4209557191 2628681889
conv2d fprop_1x1x8x16_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 4082436958 2547545036 3324685530 3597206714
conv2d fprop_1x1x8x16_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 4082436958 2547545036 3324685530 1585522588
conv2d fprop_1x7x8x16_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3137973937 2767077290 1907827554 2051304566
conv2d fprop_1x7x8x16_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3137973937 2767077290 1907827554 374967253
conv2d fprop_1x7x9x16_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 655725974 3592472200 506563703 1674820694
conv2d fprop_1x7x9x16_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 655725974 3592472200 506563703 3975853358
conv2d fprop_2x7x9x16_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 725233472 3683589771 493841232 304963909
conv2d fprop_2x7x9x16_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 725233472 3683589771 493841232 564533608
conv2d fprop_3x7x9x16_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2099667058 3573646278 1206332722 7205531
conv2d fprop_3x7x9x16_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2099667058 3573646278 1206332722 3794965864
conv2d fprop_3x7x9x16_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2099667058 3329730583 1710685046 3598855498
conv2d fprop_3x7x9x16_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2099667058 3329730583 1710685046 3145627823
conv2d fprop_3x7x9x16_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2099667058 817147799 3026961444 1414034801
conv2d fprop_3x7x9x16_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2099667058 817147799 3026961444 2252310527
conv2d fprop_1x11x7x16_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1291281134 2909557486 3324685530 2255601108
conv2d fprop_1x11x7x16_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1291281134 2909557486 3324685530 2255601108
conv2d fprop_1x11x7x16_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1291281134 2767077290 3324685530 1579121635
conv2d fprop_1x11x7x16_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1291281134 2767077290 3324685530 1047334046
conv2d fprop_1x13x11x16_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1759229365 2909557486 1907827554 2852376056
conv2d fprop_1x13x11x16_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1759229365 2909557486 1907827554 2852376056
conv2d fprop_1x17x19x16_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1263288900 1744815467 2720280253 2089128292
conv2d fprop_1x17x19x16_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1263288900 1744815467 2720280253 638322597
conv2d fprop_1x23x5x16_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1511055498 474572393 1710685046 2879179680
conv2d fprop_1x23x5x16_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1511055498 474572393 1710685046 795194450
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3754468132 3475016041 1588474612 3183183520
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3754468132 3475016041 1588474612 3183183520
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3716123936 1149399708 1907179330 1630548311
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3716123936 1149399708 1907179330 1880077064
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1375227342 2508824805 320006437 1729280118
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1375227342 2508824805 320006437 2905577482
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 4026202008 1287566710 1898545094 1486216406
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 4026202008 1287566710 1898545094 2323099205
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2844675317 4066343306 4242252933 2049528680
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2844675317 4066343306 4242252933 823670492
conv2d fprop_1x15x19x48_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 361106642 1568764056 3184621425 2460081734
conv2d fprop_1x15x19x48_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 361106642 1568764056 3184621425 288784852
conv2d fprop_1x16x24x80_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 4020962878 2388318674 3148695436 4074620609
conv2d fprop_1x16x24x80_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 4020962878 2388318674 3148695436 1605237591
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3423715025 4214947574 1328605014 2088140151
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3423715025 4214947574 1328605014 4055269725
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 386898678 2914579947 3231726095 404674518
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 386898678 2914579947 3231726095 404674518
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 401261840 1032488977 2856763908 1755771098
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 401261840 1032488977 2856763908 2984060885
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3490742496 4290221705 2240369427 3419649411
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3490742496 4290221705 2240369427 2709709134
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 674972000 4290221705 936455799 4083729015
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 674972000 4290221705 936455799 521087104
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3559114385 611927961 3672240685 3952711909
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3559114385 611927961 3672240685 831276460
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2456458966 4290221705 2301484646 1300821064
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2456458966 4290221705 2301484646 2700027247
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2456458966 4290221705 2301484646 4025827387
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2456458966 4290221705 2301484646 2458486788
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1536613554 3309037265 3087350413 4020856657
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1536613554 3309037265 3087350413 3244570506
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2165036913 3329730583 612960361 4168246341
conv2d fprop_1x32x32x16_6x16_32x3x3_pad_h1w1_stride_h6w2_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2165036913 3329730583 612960361 2987573285
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2944909811 3592472200 1605228522 3887013673
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 2944909811 3592472200 1605228522 1802699064
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 747123297 2666823963 4290039622 1215151709
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 747123297 2666823963 4290039622 3031516069
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1618850980 1182471718 961406695 372399325
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 1618850980 1182471718 961406695 2003082608
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3643206226 3835297279 520645775 3465036547
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 3643206226 3835297279 520645775 4223629118
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 431903943 1729040908 358345442 4245746659
conv2d fprop_1x233x35x48_233x35_24x7x5_pad_h3w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nhwc_s8nhwc_inhwc_i_f 431903943 1729040908 358345442 1224340034
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 s8nhwc_s8nhwc_inhwc_i_f 4121454290 3081115403 2255344759 3879663798
conv2d fprop_1x1x1x32_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1274533679 3493243764 4209557191 1794065453
conv2d fprop_1x1x1x32_3x3_8x1x1_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1274533679 3493243764 4209557191 1794065453
conv2d fprop_1x1x8x32_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3620204349 4039599338 3324685530 2607282269
conv2d fprop_1x1x8x32_3x8_8x1x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3620204349 4039599338 3324685530 342506690
conv2d fprop_1x7x8x32_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4077428439 1945710027 1907827554 3710378399
conv2d fprop_1x7x8x32_7x8_8x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4077428439 1945710027 1907827554 1781834480
conv2d fprop_1x7x9x32_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2705691693 98103785 506563703 4119696922
conv2d fprop_1x7x9x32_6x8_8x4x4_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2705691693 98103785 506563703 2431904689
conv2d fprop_2x7x9x32_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3097300362 3751678476 493841232 4001455828
conv2d fprop_2x7x9x32_5x7_8x5x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3097300362 3751678476 493841232 1571483249
conv2d fprop_3x7x9x32_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1866766242 2133678546 1206332722 1403098053
conv2d fprop_3x7x9x32_4x7_8x6x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1866766242 2133678546 1206332722 1404854483
conv2d fprop_3x7x9x32_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1866766242 2687010637 1710685046 1600340471
conv2d fprop_3x7x9x32_4x6_8x6x6_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1866766242 2687010637 1710685046 994371582
conv2d fprop_3x7x9x32_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1866766242 1180898714 3026961444 2433465010
conv2d fprop_3x7x9x32_3x5_8x7x7_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1866766242 1180898714 3026961444 285484823
conv2d fprop_1x11x7x32_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4135010890 3493243764 3324685530 4263674457
conv2d fprop_1x11x7x32_6x4_8x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4135010890 3493243764 3324685530 4263674457
conv2d fprop_1x11x7x32_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4135010890 1945710027 3324685530 498513214
conv2d fprop_1x11x7x32_6x4_8x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4135010890 1945710027 3324685530 4201919667
conv2d fprop_1x13x11x32_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 201700668 3493243764 1907827554 922168319
conv2d fprop_1x13x11x32_8x7_8x1x1_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 201700668 3493243764 1907827554 922168319
conv2d fprop_1x17x19x32_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1446981531 3656150002 2720280253 731620572
conv2d fprop_1x17x19x32_9x10_16x2x2_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1446981531 3656150002 2720280253 2646086767
conv2d fprop_1x23x5x32_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2846234135 4032399193 1710685046 3988493390
conv2d fprop_1x23x5x32_12x3_16x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2846234135 4032399193 1710685046 876293908
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3622290451 1505540897 1588474612 3183183520
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3622290451 1505540897 1588474612 3183183520
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3586800483 2619789293 1907179330 1630548311
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3586800483 2619789293 1907179330 1880077064
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 78021249 449214431 320006437 1729280118
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 78021249 449214431 320006437 2905577482
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1731762070 2256228363 1898545094 1486216406
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1731762070 2256228363 1898545094 2323099205
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3184694370 1580258916 4242252933 2049528680
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3184694370 1580258916 4242252933 823670492
conv2d fprop_1x15x19x64_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 311384756 2487637155 3184621425 1268005490
conv2d fprop_1x15x19x64_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 311384756 2487637155 3184621425 4214263209
conv2d fprop_1x16x24x96_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 407775809 1638222167 3148695436 2894438838
conv2d fprop_1x16x24x96_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 407775809 1638222167 3148695436 1246130088
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4006852980 809343331 1328605014 2088140151
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 4006852980 809343331 1328605014 4055269725
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2370365802 4043424400 3231726095 404674518
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2370365802 4043424400 3231726095 404674518
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2744507507 3011298323 2856763908 1755771098
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 2744507507 3011298323 2856763908 2984060885
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1348352570 3581007866 2240369427 3419649411
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1348352570 3581007866 2240369427 2709709134
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1293446836 3581007866 936455799 4083729015
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1293446836 3581007866 936455799 521087104
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3716781942 2056918974 3672240685 3952711909
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3716781942 2056918974 3672240685 831276460
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3230209466 3581007866 2301484646 1300821064
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3230209466 3581007866 2301484646 2700027247
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3230209466 3581007866 2301484646 4025827387
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3230209466 3581007866 2301484646 2458486788
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3752219115 2612889427 3087350413 4020856657
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 3752219115 2612889427 3087350413 3244570506
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 712760952 3656150002 1605228522 3887013673
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 712760952 3656150002 1605228522 1802699064
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1998572675 3327908208 4290039622 1215151709
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1998572675 3327908208 4290039622 3031516069
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1104335117 3889837239 961406695 372399325
conv2d fprop_4x2x3x256_1x1_328x3x5_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 1104335117 3889837239 961406695 2003082608
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 260007636 1848202930 520645775 3465036547
conv2d fprop_1x124x224x96_229x129_24x7x7_pad_h3w3_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nhwc_s4nhwc_inhwc_i_f 260007636 1848202930 520645775 4223629118
conv2d fprop_1x17x11x288_17x11_160x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha2_beta2 s4nhwc_s4nhwc_inhwc_i_f 2451612476 2037530725 2255344759 3879663798

View File

@ -0,0 +1,128 @@
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2257020387 2306573932 56677867 1786106543
conv2d fprop_1x15x19x160_15x19_224x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2257020387 2306573932 56677867 1786106543
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1156972542 2907159083 2175481248 3712392696
conv2d fprop_1x19x37x160_10x19_224x3x3_pad_h1w1_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1156972542 2907159083 2175481248 4128818508
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3622914431 360329309 1000827686 3397816796
conv2d fprop_1x16x16x160_17x16_224x2x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3622914431 360329309 1000827686 4023952937
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 333387085 3931688998 1579688492 2803910439
conv2d fprop_1x23x21x128_23x21_224x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 333387085 3931688998 1579688492 3489895425
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2517840716 1167172924 941948898 854314410
conv2d fprop_1x29x37x160_29x37_224x5x5_pad_h2w2_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2517840716 1167172924 941948898 1777561699
conv2d fprop_1x15x19x64_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 993960861 2689618577 345208683 1561585450
conv2d fprop_1x15x19x64_15x19_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 993960861 2689618577 345208683 2857545178
conv2d fprop_1x16x24x96_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2390973039 3400735473 1409384107 1984034023
conv2d fprop_1x16x24x96_16x24_96x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2390973039 3400735473 1409384107 2037481465
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1491809625 4124099354 4139509970 978245698
conv2d fprop_1x13x16x288_7x8_160x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1491809625 4124099354 4139509970 3910925680
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 272928955 1481031949 3330491456 111364403
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 272928955 1481031949 3330491456 111364403
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 401261840 318138824 1323519634 3290313862
conv2d fprop_1x71x80x32_36x40_64x5x5_pad_h2w2_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 401261840 318138824 1323519634 3540214472
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 465953721 1662236565 1710006728 3977590264
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 465953721 1662236565 1710006728 3361009847
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2643174311 1662236565 1815140928 3586291526
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2643174311 1662236565 1815140928 726840541
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 4293764010 4142851469 1225898575 3671738402
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 4293764010 4142851469 1225898575 1183585862
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1437928962 1662236565 3221182201 980724445
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1437928962 1662236565 3221182201 1864754285
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1437928962 1662236565 3221182201 520312359
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 1437928962 1662236565 3221182201 2915637276
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2058879935 3902389594 1882642169 1604948913
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2058879935 3902389594 1882642169 4198560030
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2944909811 3226488785 3103396187 1821576460
conv2d fprop_32x24x32x32_24x31_32x1x2_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2944909811 3226488785 3103396187 1178412803
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 844345223 3833205704 2120200862 3212986739
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 844345223 3833205704 2120200862 426277367
conv2d fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2680465245 2224844652 1189066576 2095234196
conv2d fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2680465245 2224844652 1189066576 2095234196
conv2d fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2680465245 3330175594 2327522013 4239788654
conv2d fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2680465245 3330175594 2327522013 4239788654
conv2d fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2680465245 2942065884 2327522013 2474295423
conv2d fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2680465245 2942065884 2327522013 2015087380
conv2d fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2494788361 673559002 2327522013 2262256181
conv2d fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2494788361 673559002 2327522013 2262256181
conv2d fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2494788361 1481031949 2522097906 1586033176
conv2d fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2494788361 1481031949 2522097906 1586033176
conv2d fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2494788361 2508231365 3519987931 2139994607
conv2d fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2494788361 2508231365 3519987931 2139994607
conv2d fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3118588240 2407183407 3519987931 2315728838
conv2d fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3118588240 2407183407 3519987931 3439977625
conv2d fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3118588240 3633353507 2522097906 1293871809
conv2d fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3118588240 3633353507 2522097906 1293871809
conv2d fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3830854792 594370640 3519987931 1641417207
conv2d fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3830854792 594370640 3519987931 1641417207
conv2d fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3830854792 415008779 2163698124 1309114882
conv2d fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3830854792 415008779 2163698124 1309114882
conv2d fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3830854792 3137005789 1648179354 57450329
conv2d fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3830854792 3137005789 1648179354 57450329
conv2d fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 901927536 3144319670 1648179354 2433410615
conv2d fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 901927536 3144319670 1648179354 1242210609
conv2d fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 901927536 1994427383 2163698124 4149927306
conv2d fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 901927536 1994427383 2163698124 4149927306
conv2d fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2446540417 1805451200 1648179354 2061091838
conv2d fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2446540417 1805451200 1648179354 2061091838
conv2d fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2446540417 1160209190 4271553919 4158225587
conv2d fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2446540417 1160209190 4271553919 4158225587
conv2d fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2446540417 3270127523 3766582212 2050622635
conv2d fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 2446540417 3270127523 3766582212 2050622635
conv2d fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 673124514 2964077129 3766582212 540078333
conv2d fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 673124514 2964077129 3766582212 1459986551
conv2d fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 673124514 162466699 4271553919 4229033905
conv2d fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 673124514 162466699 4271553919 4229033905
conv2d fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3790854543 1740163851 3766582212 666611661
conv2d fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s8nc32hw32_s8c32rsk32_s8nc32hw32_i_f 3790854543 1740163851 3766582212 666611661
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3563756534 4145401287 2774147186 516022831
conv2d fprop_1x55x51x256_28x26_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3563756534 4145401287 2774147186 516022831
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2958274559 2084126045 1988418915 2830875772
conv2d fprop_1x27x23x256_9x7_512x3x3_pad_h0w0_stride_h3w3_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2958274559 2084126045 1988418915 3488898477
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1464005709 2084126045 4276149125 1229313578
conv2d fprop_1x27x31x256_12x11_512x3x3_pad_h5w7_stride_h3w4_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1464005709 2084126045 4276149125 1822992361
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3218517333 2442721868 2671270533 2371226722
conv2d fprop_1x27x35x256_15x9_512x7x5_pad_h11w7_stride_h3w5_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3218517333 2442721868 2671270533 1280057593
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1354370892 2084126045 4193566385 2927747028
conv2d fprop_1x27x27x256_27x14_512x3x3_pad_h1w1_stride_h1w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1354370892 2084126045 4193566385 1389616458
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1354370892 2084126045 4193566385 1186086047
conv2d fprop_1x27x27x256_14x27_512x3x3_pad_h1w1_stride_h2w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1354370892 2084126045 4193566385 929529143
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2304806251 3157706556 3303866450 1115195627
conv2d fprop_3x28x28x256_14x14_256x2x2_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2304806251 3157706556 3303866450 1898128533
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2637544259 2993513863 3602417067 2435518052
conv2d fprop_4x4x5x128_3x3_256x3x6_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2637544259 2993513863 3602417067 173672416
conv2d fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3301525734 2221050180 2689662309 2294233865
conv2d fprop_1x56x56x64_56x56_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3301525734 2221050180 2689662309 2294233865
conv2d fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3301525734 98103785 2280943499 2499302634
conv2d fprop_1x56x56x64_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3301525734 98103785 2280943499 2499302634
conv2d fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3301525734 1677636452 2280943499 2796886958
conv2d fprop_1x56x56x64_56x56_64x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3301525734 1677636452 2280943499 1708111283
conv2d fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1130520359 59038063 2280943499 2620671899
conv2d fprop_1x56x56x256_56x56_64x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1130520359 59038063 2280943499 2620671899
conv2d fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1130520359 4145401287 1219103855 3961007091
conv2d fprop_1x56x56x256_28x28_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1130520359 4145401287 1219103855 3961007091
conv2d fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1130520359 504379703 1488928479 1427134856
conv2d fprop_1x56x56x256_28x28_128x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1130520359 504379703 1488928479 1427134856
conv2d fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 899899803 1505875757 1488928479 396727280
conv2d fprop_1x28x28x128_28x28_128x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 899899803 1505875757 1488928479 614758331
conv2d fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 899899803 1730326830 1219103855 2571923929
conv2d fprop_1x28x28x128_28x28_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 899899803 1730326830 1219103855 2571923929
conv2d fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 816701080 1375821331 1488928479 4192533639
conv2d fprop_1x28x28x512_28x28_128x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 816701080 1375821331 1488928479 4192533639
conv2d fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 816701080 1276141125 806482633 3315974235
conv2d fprop_1x28x28x512_14x14_1024x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 816701080 1276141125 806482633 3315974235
conv2d fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 816701080 1201032911 1764365805 2880519032
conv2d fprop_1x28x28x512_14x14_256x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 816701080 1201032911 1764365805 2880519032
conv2d fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2248088895 3515084013 1764365805 2795451116
conv2d fprop_1x14x14x256_14x14_256x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2248088895 3515084013 1764365805 3995792090
conv2d fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2248088895 2239379728 806482633 3653954546
conv2d fprop_1x14x14x256_14x14_1024x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 2248088895 2239379728 806482633 3653954546
conv2d fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 4171891827 3739025576 1764365805 3540733588
conv2d fprop_1x14x14x1024_14x14_256x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 4171891827 3739025576 1764365805 3540733588
conv2d fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 4171891827 4128795926 2366524779 2258473990
conv2d fprop_1x14x14x1024_7x7_2048x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 4171891827 4128795926 2366524779 2258473990
conv2d fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 4171891827 3574788779 1867333940 3661997755
conv2d fprop_1x14x14x1024_7x7_512x1x1_pad_h0w0_stride_h2w2_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 4171891827 3574788779 1867333940 3661997755
conv2d fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1843516393 560338949 1867333940 512869068
conv2d fprop_1x7x7x512_7x7_512x3x3_pad_h1w1_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1843516393 560338949 1867333940 147207245
conv2d fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1843516393 1545827399 2366524779 2494918310
conv2d fprop_1x7x7x512_7x7_2048x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 1843516393 1545827399 2366524779 2494918310
conv2d fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_corr_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3623215010 2231173245 1867333940 1230240181
conv2d fprop_1x7x7x2048_7x7_512x1x1_pad_h0w0_stride_h1w1_dil_h1w1_conv_alpha1_beta0 s4nc64hw64_s4c64rsk64_s4nc64hw64_i_f 3623215010 2231173245 1867333940 1230240181

View File

@ -22,6 +22,7 @@
cutlass_test_unit_add_executable(
cutlass_test_unit_epilogue_thread
activation.cu
linear_combination.cu
linear_combination_planar_complex.cu
)

View File

@ -0,0 +1,314 @@
/***************************************************************************************************
* Copyright (c) 2017-2021, NVIDIA CORPORATION. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without modification, are permitted
* provided that the following conditions are met:
* * Redistributions of source code must retain the above copyright notice, this list of
* conditions and the following disclaimer.
* * Redistributions in binary form must reproduce the above copyright notice, this list of
* conditions and the following disclaimer in the documentation and/or other materials
* provided with the distribution.
* * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used
* to endorse or promote products derived from this software without specific prior written
* permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
* FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
* OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*
**************************************************************************************************/
/*! \file
\brief Unit tests for thread-level GEMM
*/
#include "../../common/cutlass_unit_test.h"
#include "cutlass/epilogue/thread/activation.h"
#include "cutlass/util/host_tensor.h"
/////////////////////////////////////////////////////////////////////////////////////////////////
template <typename T, int N, typename Func>
__global__ void test_Epilogue_thread_activation(T *out, T *in) {
cutlass::Array<T, N> *vec_out = reinterpret_cast<cutlass::Array<T, N> *>(out);
cutlass::Array<T, N> *vec_in = reinterpret_cast<cutlass::Array<T, N> *>(in);
Func func;
vec_out[threadIdx.x] = func(vec_in[threadIdx.x]);
}
/////////////////////////////////////////////////////////////////////////////////////////////////
//
// Reference
//
static double GELU_golden_input[] = {
1.587425827980, 1.157652974129, 0.750432848930, -0.965980410576,
-0.388184845448, 0.014422321692, 0.353164494038, 1.354383468628,
0.167588576674, 0.272798538208, -0.377032428980, 1.923444747925,
0.308164477348, -0.341318070889, 0.278338819742, -0.292668998241,
-1.051743745804, -0.814175724983, 0.112737402320, 1.262938618660,
-1.582363605499, 0.722016870975, 1.053453564644, -0.659764587879,
0.734917521477, 0.091274201870, 0.604461073875, -0.219043627381,
-0.136795744300, 0.960650205612, -1.805408835411, 0.091029644012,
-1.023343324661, 0.147713735700, -0.499895423651, 1.351878166199,
-1.631091356277, -0.336171895266, -1.612408638000, 0.090832948685,
-0.658132910728, -0.326727777719, -1.986387014389, 0.787685871124,
-1.015677452087, -0.225094825029, 0.876752018929, 0.744826257229,
0.870290279388, -0.757595360279, 1.510331749916, 0.750012576580,
0.906444966793, -0.915759027004, 1.260277032852, -0.158465340734,
-0.109191477299, -0.817102134228, 0.391305118799, -0.524910449982,
0.351349592209, 0.801979541779, 0.446691334248, -0.741077482700,
1.205966711044, -0.910210072994, 0.945986449718, 0.784096539021,
1.670521497726, 0.344931513071, -0.301411420107, 0.309870749712,
-0.879704594612, -1.951189517975, -0.805817663670, -0.661812782288,
-0.505914270878, -1.836273789406, -0.381845980883, -0.554707705975,
-0.375447630882, -0.516645610332, 0.509586095810, 1.087131023407,
2.664817094803, -1.558295488358, -0.076461032033, -0.504621028900,
1.327111959457, -1.819981694221, 1.350415468216, -2.074112653732,
1.501431345940, -1.339013576508, 0.162817999721, -1.473457217216,
0.357770472765, 0.188413277268, 1.601302266121, -0.653882205486,
0.856162548065, 0.763102591038, -0.526283502579, 0.581961452961,
0.089969776571, 1.968745589256, 0.545802056789, -1.168786048889,
1.206663012505, -0.109096683562, -1.223938226700, 0.744599223137,
-1.779406785965, 0.766436159611, -0.579044401646, -1.002057313919,
-0.715845823288, -0.562508940697, 0.886768460274, 2.327786445618,
-0.148763969541, -0.918884515762, -0.367678701878, -1.105021238327,
-0.461237311363, 0.158228352666, -0.254040330648, 1.427477598190,
0.277530491352, 0.046293262392, -0.535557329655, -1.486695051193,
-0.953706681728, -1.040495038033, -0.314667612314, 0.348172843456,
0.522773325443, 0.025960063562, -0.482472360134, 1.993084549904,
-0.253064930439, -0.012146313675, -2.166327714920, 0.398040622473,
-0.022238900885, -0.443580865860, -0.898376941681, -0.571689844131,
1.666979670525, -0.831176340580, -0.671057403088, 0.481970995665,
-1.096243023872, -1.493894338608, 0.596651911736, -0.229505166411,
1.165976166725, 0.905094027519, 0.049716457725, -1.362933635712,
-0.366948783398, 1.461613893509, -0.718411505222, 0.895385026932,
-0.763122260571, 1.329716682434, 1.366570711136, -0.086544901133,
0.059739742428, 0.940766513348, -0.272854357958, -1.738811373711,
-0.361239165068, 0.696977972984, 1.288442254066, 1.264815807343,
-0.573566436768, -1.141678214073, 0.081865988672, -0.886228799820,
-0.236933603883, 1.050115466118, -0.538952171803, 0.651773929596,
-0.220034509897, -1.198960781097, 1.247478365898, -0.053529661149,
0.639809548855, 1.672434806824, 0.511088073254, -1.179364681244,
-0.730427742004, 0.157630980015, 0.389369845390, -0.925578773022,
-0.093250080943, -0.391062080860, 0.852983593941, 1.868778109550,
-1.198786258698, 0.604997038841, -1.482687234879, -2.469333171844,
0.718807697296, -0.559609353542, 2.187228441238, -2.927527904510,
0.148535788059, -0.097280368209, 0.674131810665, -1.137645959854,
0.792729616165, -1.166317462921, -0.498791724443, 1.675866723061,
-0.137909621000, -0.653263568878, -2.281216144562, 0.296096831560,
2.002410173416, 1.083609819412, 0.933580815792, -1.504760265350,
2.185185909271, 0.286121010780, -1.035485863686, -0.216372340918,
-0.274334043264, -0.849510788918, -1.397169828415, -0.407644748688,
0.159476816654, -0.170650705695, 0.335193097591, -0.156852483749,
0.036168430001, 0.858105242252, -1.086121797562, 0.404813349247,
-0.481496721506, -0.389882832766, 0.020690204576, -0.772020936012,
-0.758921504021, 0.323482036591, 0.115715265274, -0.811228036880,
-0.882436633110, 0.176811277866, 1.678015947342, 0.379081040621,
-0.842976212502, 0.346952259541, -0.545828759670, 1.632800459862
};
static double GELU_golden_output[] = {
1.498199582100, 1.014679551125, 0.580462038517, -0.161344811320,
-0.135453075171, 0.007294139825, 0.225325092673, 1.235459089279,
0.094946734607, 0.165724009275, -0.133120641112, 1.871103763580,
0.191376730800, -0.125069886446, 0.169681981206, -0.112644664943,
-0.154036879539, -0.169163048267, 0.061428427696, 1.132469892502,
-0.089851818979, 0.552240371704, 0.899579226971, -0.168043658137,
0.565008401871, 0.048956073821, 0.439583092928, -0.090532489121,
-0.060955654830, 0.798911273479, -0.064101703465, 0.048816055059,
-0.156645998359, 0.082529976964, -0.154254898429, 1.232632875443,
-0.083896033466, -0.123835846782, -0.086161509156, 0.048703473061,
-0.167972877622, -0.121522113681, -0.046670529991, 0.617986679077,
-0.157319813967, -0.092503339052, 0.709896743298, 0.574865520000,
0.703132867813, -0.169963955879, 1.411436080933, 0.580042064190,
0.741154611111, -0.164741978049, 1.129479527473, -0.069256491959,
-0.049848672003, -0.169087052345, 0.255214750767, -0.157380074263,
0.223928079009, 0.632535398006, 0.300378054380, -0.169946283102,
1.068588852882, -0.165071934462, 0.783203184605, 0.614346146584,
1.591325283051, 0.219006344676, -0.115003645420, 0.192637458444,
-0.166712537408, -0.049788996577, -0.169361919165, -0.168130636215,
-0.155041679740, -0.060888241976, -0.134137839079, -0.160614117980,
-0.132782235742, -0.156389534473, 0.354075312614, 0.936574816704,
2.654553413391, -0.092845752835, -0.035900454968, -0.154874503613,
1.204704761505, -0.062572605908, 1.230982899666, -0.039479542524,
1.401402950287, -0.120890334249, 0.091938301921, -0.103604510427,
0.228880971670, 0.108285568655, 1.513783097267, -0.167782157660,
0.688394129276, 0.593158841133, -0.157540664077, 0.418839782476,
0.048209801316, 1.920528769493, 0.386099845171, -0.141709372401,
1.069367766380, -0.049809500575, -0.135230198503, 0.574639260769,
-0.066881760955, 0.596510827541, -0.162873372436, -0.158483341336,
-0.169686436653, -0.161375194788, 0.720409095287, 2.304597616196,
-0.065585561097, -0.164551988244, -0.131098195910, -0.148708447814,
-0.148663327098, 0.089060656726, -0.101548098028, 1.317959904671,
0.169103100896, 0.024001283571, -0.158595800400, -0.101909510791,
-0.162240833044, -0.155090972781, -0.118474565446, 0.221488356590,
0.365645468235, 0.013248858973, -0.151851043105, 1.946992278099,
-0.101253561676, -0.006014300976, -0.032804865390, 0.260597169399,
-0.010922161862, -0.145792976022, -0.165743649006, -0.162226170301,
1.587365984917, -0.168676435947, -0.168497130275, 0.330191940069,
-0.149622067809, -0.100989677012, 0.432351946831, -0.093922272325,
1.023946166039, 0.739726305008, 0.025843897834, -0.117827951908,
-0.130937814713, 1.356489539146, -0.169726014137, 0.729478538036,
-0.169943705201, 1.207641005516, 1.249209761620, -0.040288090706,
0.031292784959, 0.777626037598, -0.107090584934, -0.071350336075,
-0.129670530558, 0.527676224709, 1.161149263382, 1.134579420090,
-0.162394225597, -0.144757837057, 0.043603736907, -0.166386902332,
-0.096278958023, 0.895924389362, -0.158969298005, 0.484089732170,
-0.090857118368, -0.138206124306, 1.115107178688, -0.025622237474,
0.472724437714, 1.593463659286, 0.355387806892, -0.140493586659,
-0.169871479273, 0.088687323034, 0.253673940897, -0.164135158062,
-0.043161027133, -0.136040985584, 0.685087263584, 1.811169505119,
-0.138226687908, 0.440080583096, -0.102422207594, -0.016713079065,
0.549075841904, -0.161096408963, 2.155813455582, -0.005001218989,
0.083037458360, -0.044870752841, 0.505522191525, -0.145202502608,
0.623111069202, -0.141991063952, -0.154108211398, 1.597298502922,
-0.061391282827, -0.167753636837, -0.025704355910, 0.182520583272,
1.957115054131, 0.932696640491, 0.769961357117, -0.099604383111,
2.153636932373, 0.175279796124, -0.155551761389, -0.089653611183,
-0.107515335083, -0.168032020330, -0.113423995674, -0.139319628477,
0.089841812849, -0.073763631284, 0.211594089866, -0.068651281297,
0.018605981022, 0.690416753292, -0.150658726692, 0.266040354967,
-0.151710823178, -0.135800719261, 0.010515870526, -0.169883996248,
-0.169960290194, 0.202769815922, 0.063187584281, -0.169236257672,
-0.166577890515, 0.100812792778, 1.599699616432, 0.245525524020,
-0.168275654316, 0.220552831888, -0.159705042839, 1.549110531807
};
/////////////////////////////////////////////////////////////////////////////////////////////////
TEST(Epilogue_thread_gelu_taylor, device_f32) {
int const kN = 256;
int const kV = 4;
using Element = float;
using Func = cutlass::epilogue::thread::GELU_taylor<cutlass::Array<Element, kV>>;
double tolerance = 0.005;
//
// Construct workspace
//
cutlass::HostTensor<Element, cutlass::layout::RowMajor> tensor_Destination({1, kN});
cutlass::HostTensor<Element, cutlass::layout::RowMajor> tensor_Source({1, kN});
for (int i = 0; i < kN; ++i) {
tensor_Source.host_data(i) = Element(GELU_golden_input[i]);
}
tensor_Destination.sync_device();
tensor_Source.sync_device();
//
// Launch the kernel
//
dim3 grid(1,1,1);
dim3 block(kN / kV, 1, 1);
test_Epilogue_thread_activation<Element, kV, Func><<< grid, block >>>(
tensor_Destination.device_data(),
tensor_Source.device_data());
tensor_Destination.sync_host();
//
// Verify
//
for (int i = 0; i < kN; ++i) {
Element input = Element(GELU_golden_input[i]);
Element got = tensor_Destination.host_data(i);
Element expected = Element(GELU_golden_output[i]);
double rel_error = (double(got) - double(expected)) / double(expected);
double tolerance_override = tolerance;
switch (i) {
case 142: tolerance_override = 0.008; break;
case 203: tolerance_override = 0.03; break;
case 207: tolerance_override = 0.09; break;
case 218: tolerance_override = 0.013; break;
}
EXPECT_LT(std::abs(rel_error), tolerance_override)
<< "Input[" << i << "]: " << input << ", Got: " << got << ", expected: " << expected;
}
}
/////////////////////////////////////////////////////////////////////////////////////////////////
TEST(Epilogue_thread_gelu_taylor, device_f16) {
int const kN = 256;
int const kV = 8;
using Element = cutlass::half_t;
using Func = cutlass::epilogue::thread::GELU_taylor<cutlass::Array<Element, kV>>;
double tolerance = 0.005;
//
// Construct workspace
//
cutlass::HostTensor<Element, cutlass::layout::RowMajor> tensor_Destination({1, kN});
cutlass::HostTensor<Element, cutlass::layout::RowMajor> tensor_Source({1, kN});
for (int i = 0; i < kN; ++i) {
tensor_Source.host_data(i) = Element(GELU_golden_input[i]);
}
tensor_Destination.sync_device();
tensor_Source.sync_device();
//
// Launch the kernel
//
dim3 grid(1,1,1);
dim3 block(kN / kV, 1, 1);
test_Epilogue_thread_activation<Element, kV, Func><<< grid, block >>>(
tensor_Destination.device_data(),
tensor_Source.device_data());
tensor_Destination.sync_host();
//
// Verify
//
for (int i = 0; i < kN; ++i) {
Element input = Element(GELU_golden_input[i]);
Element got = tensor_Destination.host_data(i);
Element expected = Element(GELU_golden_output[i]);
double rel_error = (double(got) - double(expected)) / double(expected);
double tolerance_override = tolerance;
switch (i) {
case 36: tolerance_override = 0.006; break;
case 77: tolerance_override = 0.009; break;
case 95: tolerance_override = 0.008; break;
case 112: tolerance_override = 0.007; break;
case 171: tolerance_override = 0.006; break;
case 203: tolerance_override = 0.03; break;
case 207: tolerance_override = 0.15; break;
}
EXPECT_LT(std::abs(rel_error), tolerance_override)
<< "Input[" << i << "]: " << input << ", Got: " << got << ", expected: " << expected;
}
}
/////////////////////////////////////////////////////////////////////////////////////////////////

View File

@ -159,3 +159,41 @@ TEST(Epilogue_thread_linear_combination_gelu, device_side_f16_f16_ptr) {
}
/////////////////////////////////////////////////////////////////////////////////////////////////
TEST(Epilogue_thread_linear_combination_gelu_taylor, device_side_f16_f16_ptr) {
using Element = cutlass::half_t;
using ElementOutput = cutlass::half_t;
int const kCount = 8;
using LinearCombinationGELU = cutlass::epilogue::thread::LinearCombinationGELU<
ElementOutput,
kCount,
Element,
Element>;
Element alpha = Element(1);
Element beta = Element(0);
typename LinearCombinationGELU::Params params(&alpha, &beta);
LinearCombinationGELU linear_combination_op(params);
cutlass::Array<Element, kCount> accum;
for (int i = 0; i < kCount; ++i) {
accum[i] = Element((float)i * 0.3f);
}
cutlass::Array<ElementOutput, kCount> destination = linear_combination_op(accum, accum);
cutlass::epilogue::thread::GELU<ElementOutput> gelu_func;
for (int i = 0; i < kCount; ++i) {
ElementOutput expected = gelu_func(accum[i]);
ElementOutput got = destination[i];
EXPECT_TRUE(expected == got);
}
}
/////////////////////////////////////////////////////////////////////////////////////////////////

View File

@ -51,7 +51,6 @@
#include "cutlass/matrix_coord.h"
#include "cutlass/tensor_coord.h"
#include "cutlass/layout/tensor.h"
#include "cutlass/gemm/gemm.h"
#include "cutlass/conv/convolution.h"
#include "cutlass/conv/conv2d_problem_size.h"

View File

@ -162,10 +162,11 @@ def CreateConv2dOperator(manifest, layout, tile_descriptions, data_type, alignme
# iterator algorithm (analytic and optimized)
iterator_algorithms = [IteratorAlgorithm.Analytic, IteratorAlgorithm.Optimized]
# by default, only generate the largest tile size
# by default, only generate the largest tile size, largest alignment, and optimized iterator
if manifest.args.kernels == '':
tile_descriptions = [tile_descriptions[0],]
alignment_constraints = [alignment_constraints[0],]
iterator_algorithms = [IteratorAlgorithm.Optimized]
operations = []
@ -212,12 +213,21 @@ def CreateConv2dOperator(manifest, layout, tile_descriptions, data_type, alignme
# better for problem sizes with large activation channel count
swizzling_functor_strided_dgrad_ = SwizzlingFunctor.StridedDgradIdentity1
new_operation = Conv2dOperation(ConvKind.Dgrad, IteratorAlgorithm.Analytic, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided, epilogue_functor, swizzling_functor_strided_dgrad_)
if IteratorAlgorithm.Analytic in iterator_algorithms:
new_operation = Conv2dOperation(ConvKind.Dgrad, IteratorAlgorithm.Analytic, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided, epilogue_functor, swizzling_functor_strided_dgrad_)
manifest.append(new_operation)
operations.append(new_operation)
manifest.append(new_operation)
operations.append(new_operation)
# Strided support for Optimized Dgrad
if IteratorAlgorithm.Optimized in iterator_algorithms:
new_operation = Conv2dOperation(ConvKind.Dgrad, IteratorAlgorithm.Optimized, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided, epilogue_functor, swizzling_functor_strided_dgrad_)
manifest.append(new_operation)
operations.append(new_operation)
#
# Conv2d Wgrad
#
@ -246,34 +256,70 @@ def CreateConv3dOperator(manifest, layout, tile_descriptions, data_type, alignme
# iterator algorithm (analytic and optimized)
iterator_algorithms = [IteratorAlgorithm.Analytic, IteratorAlgorithm.Optimized]
# by default, only generate the largest tile size
# by default, only generate the largest tile size and optimized iterators
if manifest.args.kernels == '':
tile_descriptions = [tile_descriptions[0],]
iterator_algorithms = [IteratorAlgorithm.Optimized]
operations = []
# All tile sizes for Conv3dFprop and Conv3dWgrad
for tile in tile_descriptions:
for conv_kind in conv_kinds:
A = TensorDescription(element_a, layout, alignment)
B = TensorDescription(element_b, layout, alignment)
C = TensorDescription(element_c, layout, alignment_c)
#
# Conv3d Fprop
#
if ConvKind.Fprop in conv_kinds:
# Strided support for Analytic and Optimized Fprop
for iterator_algorithm in iterator_algorithms:
A = TensorDescription(element_a, layout, alignment)
B = TensorDescription(element_b, layout, alignment)
C = TensorDescription(element_c, layout, alignment_c)
# optimized conv3d iterator algorithm is only for Wgrad
if (iterator_algorithm == IteratorAlgorithm.Optimized) \
and ((conv_kind == ConvKind.Fprop) or (conv_kind == ConvKind.Dgrad)):
continue
# strided support for Fprop (Analytic/Optimized), Dgrad (Analytic), and Wgrad (Analytic)
new_operation = Conv3dOperation(conv_kind, iterator_algorithm, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided, epilogue_functor)
new_operation = Conv3dOperation(ConvKind.Fprop, iterator_algorithm, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided)
manifest.append(new_operation)
operations.append(new_operation)
#
# Conv3d Wgrad
#
if ConvKind.Wgrad in conv_kinds:
# Strided support for Analytic and Optimized Wgrad
for iterator_algorithm in iterator_algorithms:
new_operation = Conv3dOperation(ConvKind.Wgrad, iterator_algorithm, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided, epilogue_functor)
manifest.append(new_operation)
operations.append(new_operation)
# All tile sizes for Conv3dDgrad
for tile in tile_descriptions:
A = TensorDescription(element_a, layout, alignment)
B = TensorDescription(element_b, layout, alignment)
C = TensorDescription(element_c, layout, alignment_c)
#
# Conv3d Dgrad
#
if ConvKind.Dgrad in conv_kinds:
# Unity stride for Optimized Dgrad
new_operation = Conv3dOperation(ConvKind.Dgrad, IteratorAlgorithm.Optimized, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Unity, epilogue_functor)
manifest.append(new_operation)
operations.append(new_operation)
# Strided support for Analytic Dgrad
# Conv3dDgrad has a naive strided support which does not cut down redundant MMAs
new_operation = Conv3dOperation(ConvKind.Dgrad, IteratorAlgorithm.Analytic, tile.minimum_compute_capability, tile,\
A, B, C, element_epilogue, StrideSupport.Strided, epilogue_functor)
manifest.append(new_operation)
operations.append(new_operation)
return operations
###################################################################################################
###################################################################################################
@ -1158,7 +1204,7 @@ def GenerateSM75_TensorOp_88128(manifest, args):
data_type = [DataType.b1, DataType.b1, DataType.s32, DataType.s32]
CreateGemmOperator(manifest, layouts, tile_descriptions, \
data_type, alignment_constraints, None, EpilogueFunctor.LinearCombinationClamp)
data_type, alignment_constraints)
#
@ -1934,7 +1980,7 @@ def GenerateSM80_TensorOp_168256(manifest, args):
data_type = [DataType.b1, DataType.b1, DataType.s32, DataType.s32]
CreateGemmOperator(manifest, layouts, tile_descriptions, \
data_type, alignment_constraints, None, EpilogueFunctor.LinearCombinationClamp)
data_type, alignment_constraints)
#

View File

@ -28,7 +28,6 @@
#include "cutlass/cutlass.h"
#include "cutlass/numeric_types.h"
#include "cutlass/complex.h"
#include "cutlass/layout/matrix.h"
#include "cutlass/library/library.h"

View File

@ -34,7 +34,6 @@
#include "cutlass/cutlass.h"
#include "cutlass/library/library.h"
#include "cutlass/library/util.h"
#include "options.h"
/////////////////////////////////////////////////////////////////////////////////////////////////

View File

@ -50,7 +50,6 @@
#include "cutlass/array.h"
#include "cutlass/complex.h"
#include "cutlass/tensor_view.h"
#include "cutlass/util/reference/device/tensor_foreach.h"
#include "cutlass/util/distribution.h"

View File

@ -42,7 +42,6 @@
#include "cutlass/subbyte_reference.h"
#include "cutlass/tensor_view.h"
#include "cutlass/tensor_view_planar_complex.h"
#include "cutlass/util/distribution.h"
#include "tensor_foreach.h"